Skip to content

Commit c832eb2

Browse files
committed
Add FileChannels.contentEquals(ReadableByteChannel, ReadableByteChannel,
int) - Improve performance of IOUtils.contentEquals(InputStream, InputStream) by about 13% - Fix JMH Maven invocation - Pick up JMH version from parent POM
1 parent e09033c commit c832eb2

File tree

5 files changed

+115
-71
lines changed

5 files changed

+115
-71
lines changed

pom.xml

+19-8
Original file line numberDiff line numberDiff line change
@@ -101,13 +101,7 @@ file comparators, endian transformation classes, and much more.
101101
<dependency>
102102
<groupId>org.openjdk.jmh</groupId>
103103
<artifactId>jmh-core</artifactId>
104-
<version>${jmh.version}</version>
105-
<scope>test</scope>
106-
</dependency>
107-
<dependency>
108-
<groupId>org.openjdk.jmh</groupId>
109-
<artifactId>jmh-generator-annprocess</artifactId>
110-
<version>${jmh.version}</version>
104+
<version>${commons.jmh.version}</version>
111105
<scope>test</scope>
112106
</dependency>
113107
</dependencies>
@@ -148,7 +142,6 @@ file comparators, endian transformation classes, and much more.
148142
</commons.osgi.import>
149143
<commons.scmPubUrl>https://svn.apache.org/repos/infra/websites/production/commons/content/proper/commons-io/</commons.scmPubUrl>
150144
<commons.scmPubCheckoutDirectory>site-content</commons.scmPubCheckoutDirectory>
151-
<jmh.version>1.37</jmh.version>
152145
<commons.bytebuddy.version>1.17.2</commons.bytebuddy.version>
153146
<japicmp.skip>false</japicmp.skip>
154147
<commons.release.isDistModule>true</commons.release.isDistModule>
@@ -357,13 +350,31 @@ file comparators, endian transformation classes, and much more.
357350
</properties>
358351
</profile>
359352
<profile>
353+
<!-- Profile to build and run the benchmarks. Use 'mvn test -Pbenchmark', and add '-Dbenchmark=foo' to run only the foo benchmark -->
360354
<id>benchmark</id>
355+
<dependencies>
356+
<dependency>
357+
<groupId>org.openjdk.jmh</groupId>
358+
<artifactId>jmh-generator-annprocess</artifactId>
359+
<version>${commons.jmh.version}</version>
360+
<scope>test</scope>
361+
</dependency>
362+
</dependencies>
361363
<properties>
362364
<skipTests>true</skipTests>
363365
<benchmark>org.apache</benchmark>
364366
</properties>
365367
<build>
366368
<plugins>
369+
<plugin>
370+
<artifactId>maven-compiler-plugin</artifactId>
371+
<version>${commons.compiler.version}</version>
372+
<configuration combine.self="override">
373+
<testIncludes>
374+
<testInclude>**/*</testInclude>
375+
</testIncludes>
376+
</configuration>
377+
</plugin>
367378
<plugin>
368379
<groupId>org.codehaus.mojo</groupId>
369380
<artifactId>exec-maven-plugin</artifactId>

src/changes/changes.xml

+2
Original file line numberDiff line numberDiff line change
@@ -64,6 +64,7 @@ The <action> type attribute can be add,update,fix,remove.
6464
<action dev="ggregory" type="fix" due-to="Gary Gregory">Avoid unnecessary boxing and unboxing of int values in UncheckedFilterReader.read().</action>
6565
<action dev="ggregory" type="fix" due-to="Gary Gregory">FileChannels.contentEquals(FileChannel, FileChannel, int) can return false when comparing a non-blocking channel.</action>
6666
<action dev="ggregory" type="fix" due-to="Gary Gregory">Deprecate FileChannels.contentEquals(FileChannel, FileChannel, int) in favor of FileChannels.contentEquals(SeekableByteChannel, SeekableByteChannel, int).</action>
67+
<action dev="ggregory" type="fix" due-to="Gary Gregory">Improve performance of IOUtils.contentEquals(InputStream, InputStream) by about 13%.</action>
6768
<!-- ADD -->
6869
<action dev="ggregory" type="add" issue="IO-860" due-to="Nico Strecker, Gary Gregory">Add ThrottledInputStream.Builder.setMaxBytes(long, ChronoUnit).</action>
6970
<action dev="ggregory" type="add" due-to="Gary Gregory">Add IOIterable.</action>
@@ -80,6 +81,7 @@ The <action> type attribute can be add,update,fix,remove.
8081
<action dev="ggregory" type="add" due-to="Gary Gregory">Add IOBooleanSupplier.</action>
8182
<action dev="ggregory" type="add" due-to="Gary Gregory">Add Uncheck.getAsBoolean(IOBooleanSupplier).</action>
8283
<action dev="ggregory" type="add" due-to="Gary Gregory">Add FileChannels.contentEquals(SeekableByteChannel, SeekableByteChannel, int).</action>
84+
<action dev="ggregory" type="add" due-to="Gary Gregory">Add FileChannels.contentEquals(ReadableByteChannel, ReadableByteChannel, int).</action>
8385
<!-- UPDATE -->
8486
<action dev="ggregory" type="update" due-to="Dependabot, Gary Gregory">Bump commons.bytebuddy.version from 1.15.10 to 1.17.2 #710, #715, #720.</action>
8587
<action dev="ggregory" type="update" due-to="Gary Gregory">Bump commons-codec:commons-codec from 1.17.1 to 1.18.0. #717.</action>

src/main/java/org/apache/commons/io/IOUtils.java

+5-38
Original file line numberDiff line numberDiff line change
@@ -61,6 +61,7 @@
6161
import java.util.stream.Stream;
6262
import java.util.zip.InflaterInputStream;
6363

64+
import org.apache.commons.io.channels.FileChannels;
6465
import org.apache.commons.io.function.IOConsumer;
6566
import org.apache.commons.io.function.IOSupplier;
6667
import org.apache.commons.io.function.IOTriFunction;
@@ -903,51 +904,17 @@ public static long consume(final Reader input) throws IOException {
903904
* exist, false otherwise
904905
* @throws IOException if an I/O error occurs
905906
*/
907+
@SuppressWarnings("resource") // Caller closes input streams
906908
public static boolean contentEquals(final InputStream input1, final InputStream input2) throws IOException {
907-
// Before making any changes, please test with
908-
// org.apache.commons.io.jmh.IOUtilsContentEqualsInputStreamsBenchmark
909+
// Before making any changes, please test with org.apache.commons.io.jmh.IOUtilsContentEqualsInputStreamsBenchmark
909910
if (input1 == input2) {
910911
return true;
911912
}
912913
if (input1 == null || input2 == null) {
913914
return false;
914915
}
915-
916-
// reuse one
917-
final byte[] array1 = getScratchByteArray();
918-
// allocate another
919-
final byte[] array2 = byteArray();
920-
int pos1;
921-
int pos2;
922-
int count1;
923-
int count2;
924-
while (true) {
925-
pos1 = 0;
926-
pos2 = 0;
927-
for (int index = 0; index < DEFAULT_BUFFER_SIZE; index++) {
928-
if (pos1 == index) {
929-
do {
930-
count1 = input1.read(array1, pos1, DEFAULT_BUFFER_SIZE - pos1);
931-
} while (count1 == 0);
932-
if (count1 == EOF) {
933-
return pos2 == index && input2.read() == EOF;
934-
}
935-
pos1 += count1;
936-
}
937-
if (pos2 == index) {
938-
do {
939-
count2 = input2.read(array2, pos2, DEFAULT_BUFFER_SIZE - pos2);
940-
} while (count2 == 0);
941-
if (count2 == EOF) {
942-
return pos1 == index && input1.read() == EOF;
943-
}
944-
pos2 += count2;
945-
}
946-
if (array1[index] != array2[index]) {
947-
return false;
948-
}
949-
}
950-
}
916+
// We do not close FileChannels because that closes the owning InputStream.
917+
return FileChannels.contentEquals(Channels.newChannel(input1), Channels.newChannel(input2), DEFAULT_BUFFER_SIZE);
951918
}
952919

953920
// TODO Consider making public

src/main/java/org/apache/commons/io/channels/FileChannels.java

+34-17
Original file line numberDiff line numberDiff line change
@@ -20,6 +20,7 @@
2020
import java.io.IOException;
2121
import java.nio.ByteBuffer;
2222
import java.nio.channels.FileChannel;
23+
import java.nio.channels.ReadableByteChannel;
2324
import java.nio.channels.SeekableByteChannel;
2425
import java.util.Objects;
2526

@@ -33,10 +34,10 @@
3334
public final class FileChannels {
3435

3536
/**
36-
* Tests if two FileChannel contents are equal starting at their respective current positions.
37+
* Tests if two file channel contents are equal starting at their respective current positions.
3738
*
38-
* @param channel1 A FileChannel.
39-
* @param channel2 Another FileChannel.
39+
* @param channel1 A file channel.
40+
* @param channel2 Another file channel.
4041
* @param bufferCapacity The two internal buffer capacities, in bytes.
4142
* @return true if the contents of both RandomAccessFiles are equal, false otherwise.
4243
* @throws IOException if an I/O error occurs.
@@ -49,10 +50,6 @@ public static boolean contentEquals(final FileChannel channel1, final FileChanne
4950

5051
/**
5152
* Tests if two readable byte channel contents are equal starting at their respective current positions.
52-
* <p>
53-
* If a file channel is a non-blocking file channel, it may return 0 bytes read for any given call. In order to avoid waiting forever when trying again, a
54-
* timeout Duration can be specified, which when met, throws an IOException.
55-
* </p>
5653
*
5754
* @param channel1 A readable byte channel.
5855
* @param channel2 Another readable byte channel.
@@ -61,27 +58,20 @@ public static boolean contentEquals(final FileChannel channel1, final FileChanne
6158
* @throws IOException if an I/O error occurs or the timeout is met.
6259
* @since 2.19.0
6360
*/
64-
public static boolean contentEquals(final SeekableByteChannel channel1, final SeekableByteChannel channel2, final int bufferCapacity) throws IOException {
61+
public static boolean contentEquals(final ReadableByteChannel channel1, final ReadableByteChannel channel2, final int bufferCapacity) throws IOException {
62+
// Before making any changes, please test with org.apache.commons.io.jmh.IOUtilsContentEqualsInputStreamsBenchmark
6563
// Short-circuit test
6664
if (Objects.equals(channel1, channel2)) {
6765
return true;
6866
}
69-
// Short-circuit test
70-
final long size1 = size(channel1);
71-
final long size2 = size(channel2);
72-
if (size1 != size2) {
73-
return false;
74-
}
75-
if (size1 == 0 && size2 == 0) {
76-
return true;
77-
}
7867
// Dig in and do the work
7968
final ByteBuffer byteBuffer1 = ByteBuffer.allocateDirect(bufferCapacity);
8069
final ByteBuffer byteBuffer2 = ByteBuffer.allocateDirect(bufferCapacity);
8170
int numRead1 = 0;
8271
int numRead2 = 0;
8372
boolean read0On1 = false;
8473
boolean read0On2 = false;
74+
// If a channel is a non-blocking channel, it may return 0 bytes read for any given call.
8575
while (true) {
8676
if (!read0On2) {
8777
numRead1 = channel1.read(byteBuffer1);
@@ -110,6 +100,33 @@ public static boolean contentEquals(final SeekableByteChannel channel1, final Se
110100
}
111101
}
112102

103+
/**
104+
* Tests if two seekable byte channel contents are equal starting at their respective current positions.
105+
* <p>
106+
* If the two channels have different sizes, no content comparison takes place, and this method returns false.
107+
* </p>
108+
*
109+
* @param channel1 A seekable byte channel.
110+
* @param channel2 Another seekable byte channel.
111+
* @param bufferCapacity The two internal buffer capacities, in bytes.
112+
* @return true if the contents of both RandomAccessFiles are equal, false otherwise.
113+
* @throws IOException if an I/O error occurs or the timeout is met.
114+
* @since 2.19.0
115+
*/
116+
public static boolean contentEquals(final SeekableByteChannel channel1, final SeekableByteChannel channel2, final int bufferCapacity) throws IOException {
117+
// Short-circuit test
118+
if (Objects.equals(channel1, channel2)) {
119+
return true;
120+
}
121+
// Short-circuit test
122+
final long size1 = size(channel1);
123+
final long size2 = size(channel2);
124+
if (size1 != size2) {
125+
return false;
126+
}
127+
return size1 == 0 && size2 == 0 || contentEquals((ReadableByteChannel) channel1, channel2, bufferCapacity);
128+
}
129+
113130
private static long size(final SeekableByteChannel channel) throws IOException {
114131
return channel != null ? channel.size() : 0;
115132
}

src/test/java/org/apache/commons/io/jmh/IOUtilsContentEqualsInputStreamsBenchmark.java

+55-8
Original file line numberDiff line numberDiff line change
@@ -24,10 +24,12 @@
2424
import java.io.BufferedInputStream;
2525
import java.io.IOException;
2626
import java.io.InputStream;
27+
import java.nio.channels.Channels;
2728
import java.nio.charset.Charset;
2829
import java.util.concurrent.TimeUnit;
2930

3031
import org.apache.commons.io.IOUtils;
32+
import org.apache.commons.io.channels.FileChannels;
3133
import org.apache.commons.lang3.StringUtils;
3234
import org.openjdk.jmh.annotations.Benchmark;
3335
import org.openjdk.jmh.annotations.BenchmarkMode;
@@ -43,14 +45,19 @@
4345
/**
4446
* Test different implementations of {@link IOUtils#contentEquals(InputStream, InputStream)}.
4547
*
46-
* <pre>
47-
* IOUtilsContentEqualsInputStreamsBenchmark.testFileCurrent avgt 5 1518342.821 ▒ 201890.705 ns/op
48-
* IOUtilsContentEqualsInputStreamsBenchmark.testFilePr118 avgt 5 1578606.938 ▒ 66980.718 ns/op
49-
* IOUtilsContentEqualsInputStreamsBenchmark.testFileRelease_2_8_0 avgt 5 2439163.068 ▒ 265765.294 ns/op
50-
* IOUtilsContentEqualsInputStreamsBenchmark.testStringCurrent avgt 5 10389834700.000 ▒ 330301175.219 ns/op
51-
* IOUtilsContentEqualsInputStreamsBenchmark.testStringPr118 avgt 5 10890915400.000 ▒ 3251289634.067 ns/op
52-
* IOUtilsContentEqualsInputStreamsBenchmark.testStringRelease_2_8_0 avgt 5 12522802960.000 ▒ 111147669.527 ns/op
53-
* </pre>
48+
* <pre>{@code
49+
Benchmark Mode Cnt Score Error Units
50+
IOUtilsContentEqualsInputStreamsBenchmark.testFileChannels avgt 5 65105.350 ± 2655.812 ns/op
51+
IOUtilsContentEqualsInputStreamsBenchmark.testFileCurrent avgt 5 75452.987 ± 260.088 ns/op
52+
IOUtilsContentEqualsInputStreamsBenchmark.testFilePr118 avgt 5 74346.141 ± 2138.149 ns/op
53+
IOUtilsContentEqualsInputStreamsBenchmark.testFileRelease_2_8_0 avgt 5 157246.303 ± 215.369 ns/op
54+
IOUtilsContentEqualsInputStreamsBenchmark.testStringCurrent avgt 5 623344988.622 ± 574407721.150 ns/op
55+
IOUtilsContentEqualsInputStreamsBenchmark.testStringFileChannels avgt 5 132847058.786 ± 1760007.730 ns/op
56+
IOUtilsContentEqualsInputStreamsBenchmark.testStringPr118 avgt 5 459079096.521 ± 512827244.936 ns/op
57+
IOUtilsContentEqualsInputStreamsBenchmark.testStringRelease_2_8_0 avgt 5 2555773583.300 ± 18112219.764 ns/op
58+
59+
[INFO] Finished at: 2025-03-03T21:11:56-05:00
60+
* }</pre>
5461
*/
5562
@BenchmarkMode(Mode.AverageTime)
5663
@OutputTimeUnit(TimeUnit.NANOSECONDS)
@@ -101,6 +108,16 @@ public static boolean contentEquals_release_2_8_0(final InputStream input1, fina
101108

102109
}
103110

111+
public static boolean contentEqualsFileChannels(final InputStream input1, final InputStream input2) throws IOException {
112+
if (input1 == input2) {
113+
return true;
114+
}
115+
if (input1 == null || input2 == null) {
116+
return false;
117+
}
118+
return FileChannels.contentEquals(Channels.newChannel(input1), Channels.newChannel(input2), IOUtils.DEFAULT_BUFFER_SIZE);
119+
}
120+
104121
public static boolean contentEqualsPr118(final InputStream input1, final InputStream input2) throws IOException {
105122
if (input1 == input2) {
106123
return true;
@@ -144,6 +161,24 @@ public static boolean contentEqualsPr118(final InputStream input1, final InputSt
144161
}
145162
}
146163

164+
@Benchmark
165+
public boolean[] testFileChannels() throws IOException {
166+
final boolean[] res = new boolean[3];
167+
try (InputStream input1 = getClass().getResourceAsStream(TEST_PATH_A);
168+
InputStream input2 = getClass().getResourceAsStream(TEST_PATH_B)) {
169+
res[0] = contentEqualsFileChannels(input1, input1);
170+
}
171+
try (InputStream input1 = getClass().getResourceAsStream(TEST_PATH_A);
172+
InputStream input2 = getClass().getResourceAsStream(TEST_PATH_A)) {
173+
res[1] = contentEqualsFileChannels(input1, input2);
174+
}
175+
try (InputStream input1 = getClass().getResourceAsStream(TEST_PATH_16K_A);
176+
InputStream input2 = getClass().getResourceAsStream(TEST_PATH_16K_A_COPY)) {
177+
res[2] = contentEqualsFileChannels(input1, input2);
178+
}
179+
return res;
180+
}
181+
147182
@Benchmark
148183
public boolean[] testFileCurrent() throws IOException {
149184
final boolean[] res = new boolean[3];
@@ -210,6 +245,18 @@ public void testStringCurrent(final Blackhole blackhole) throws IOException {
210245
}
211246
}
212247

248+
@Benchmark
249+
public void testStringFileChannels(final Blackhole blackhole) throws IOException {
250+
for (int i = 0; i < 5; i++) {
251+
for (int j = 0; j < 5; j++) {
252+
try (InputStream input1 = IOUtils.toInputStream(STRINGS[i], DEFAULT_CHARSET);
253+
InputStream input2 = IOUtils.toInputStream(STRINGS[j], DEFAULT_CHARSET)) {
254+
blackhole.consume(contentEqualsFileChannels(input1, input2));
255+
}
256+
}
257+
}
258+
}
259+
213260
@Benchmark
214261
public void testStringPr118(final Blackhole blackhole) throws IOException {
215262
for (int i = 0; i < 5; i++) {

0 commit comments

Comments
 (0)