HebiRobotics
diff --git a/‎README.md‎
Lines changed: 11 additions & 9 deletions b/‎README.md‎
Lines changed: 11 additions & 9 deletions
diff --git a/‎benchmarks/README.md‎
Lines changed: 34 additions & 34 deletions b/‎benchmarks/README.md‎
Lines changed: 34 additions & 34 deletions
diff --git a/‎benchmarks/pom.xml‎
Lines changed: 10 additions & 0 deletions b/‎benchmarks/pom.xml‎
Lines changed: 10 additions & 0 deletions
diff --git a/‎benchmarks/src/main/java/us/hebi/quickbuf/benchmarks/comparison/PackedDoublesBenchmark.java‎
Lines changed: 6 additions & 6 deletions b/‎benchmarks/src/main/java/us/hebi/quickbuf/benchmarks/comparison/PackedDoublesBenchmark.java‎
Lines changed: 6 additions & 6 deletions
diff --git a/‎benchmarks/src/main/java/us/hebi/quickbuf/benchmarks/comparison/SbeBenchmark.java‎
Lines changed: 31 additions & 37 deletions b/‎benchmarks/src/main/java/us/hebi/quickbuf/benchmarks/comparison/SbeBenchmark.java‎
Lines changed: 31 additions & 37 deletions
@@ -231,7 +231,7 @@ msg.getMutableNestedMessage().setPrimitiveValue(0);
 <details>
 <summary>String Fields</summary><p>
 
-Java `String` objects are immutable, so the API differs from Protobuf-Java in that accessors accept `CharSequence` arguments and return `StringBuilder` objects instead. `StringBuilder` can be converted via `toString()`, but you may want to use a `StringInterner` to share references if you receive many identical strings.
+`String` fields are stored internally as `Utf8String` objects that are lazily parsed and can be set from any `CharSequence`. Since Java `String` objects are immutable, there are additional access methods for decoding characters into a reusable `StringBuilder` instance, as well as for using a custom `Utf8Decoder` that can implement interning.
 
 ```proto
 // .proto
@@ -243,22 +243,24 @@ message SimpleMessage {
 ```Java
 // simplified generated code
 public final class SimpleMessage {
-    public SimpleMessage setOptionalString(CharSequence value); // copies data
+    public SimpleMessage setOptionalString(CharSequence value);
     public SimpleMessage clearOptionalString(); // sets length = 0
     public boolean hasOptionalString();
-    public StringBuilder getOptionalString(); // internal store -> treat as read-only
-    public StringBuilder getMutableOptionalString(); // internal store -> may be modified 
+    public String getOptionalString(); // lazily converted string
+    public Utf8String getOptionalStringBytes(); // internal representation -> treat as read-only
+    public Utf8String getMutableOptionalStringBytes(); // internal representation -> may be modified until has state is cleared
 
     private final StringBuilder optionalString = new StringBuilder(0);
 }
 ```
 
 ```Java
-// Set and append to a string field
-SimpleMessage msg = SimpleMessage.newInstance();
-msg.setOptionalString("my-");
-msg.getMutableOptionalString()
-    .append("text"); // field is now 'my-text'
+// Get characters
+SimpleMessage msg = SimpleMessage.newInstance()
+    .setOptionalString("my-text");
+
+StringBuilder chars = new StringBuilder();
+msg.getOptionalStringBytes().getChars(chars); // chars now contains "my-text"
 ```
 
 </p></details> 
 
@@ -11,47 +11,47 @@ The first benchmark was copied from [Small Binary Encoding's](https://mechanical
 
 | Test [msg/ms] | QuickBuffers | Protobuf-Java | Ratio
 | :----------- | :-----------: | :-----------: | :-----------: |
-| Car Encode  | 2808 (375 MB/s) | 985 (132 MB/s) |  2.9  
-| Car Decode  | 2266 (303 MB/s) | 1271 (170 MB/s) |  1.8  
-| Market Data Encode  | 8163 (498 MB/s) | 3700 (226 MB/s) |  2.2  
-| Market Data Decode  | 7535 (460 MB/s) | 3306 (202 MB/s) |  2.3  
+| Car Encode  | 3649 (487 MB/s) | 985 (132 MB/s) |  3.7  
+| Car Decode  | 2329 (311 MB/s) | 1271 (170 MB/s) |  1.8  
+| Market Data Encode  | 13177 (804 MB/s) | 3700 (226 MB/s) |  3.6  
+| Market Data Decode  | 9805 (598 MB/s) | 3306 (202 MB/s) |  3.0  
 
-Note that this test was done using the original SBE .proto definitions. If the varint types are changed to a less expensive encoding, e.g., `fixed64/32` instead of `int64/32`, the market data numbers improve by another 10-20%. By additionally inlining the small nested fields it'd result in 3-4x the original message throughput of Protobuf-Java. The choice of type can have a huge impact on the performance.
+Note that this test was done using the original SBE .proto definitions. If the varint types are changed to a less expensive encoding, e.g., `fixed64/32` instead of `int64/32`, the results improve by 30-50%. By additionally inlining the small nested fields it'd result in more than 5x the original message throughput. Overall, be aware that there is a significant trade-off between wire size and encoding speed.
 
-We also compared the built-in JSON encoding and found that for this particular benchmark the message throughput is roughly the same as Protobuf-Java. However, at 559 byte (car) and 435 byte (market) the uncompressed binary sizes are significantly larger.
+We also compared the built-in JSON encoding and found that for this particular benchmark the message throughput is on par with Protobuf-Java. However, at 559 bytes (car) and 435 bytes (market) the uncompressed JSON messages are significantly larger than their binary equivalents.
 
 <!-- car multiplier: 559 * 1000 / (1024*1024) = 0.5331 = -->
 <!-- market multiplier: 435 * 1000 / (1024*1024) = 0.415 = -->
 
 | Test [msg/ms] | QuickBuffers (JSON) | Protobuf-Java (Binary) | Ratio
 | :----------- | :-----------: | :-----------: | :-----------: |
-| Car Encode  | 1515 (808 MB/s) | 985 |  1.5  
-| Market Data Encode  | 3338 (1.4 GB/s) | 3700 |  0.9 
+| Car Encode  | 1599 (852 MB/s) | 985 |  1.6  
+| Market Data Encode  | 3691 (1.5 GB/s) | 3700 |  1.0 
 
 ## Benchmark 2 - File Streams
 
-We also ran benchmarks for reading and writing streams of delimited protobuf messages with varying contents, which is similar to reading sequentially from a log file. All datasets were loaded into memory and decoded from a byte array. Neither benchmark triggers Protobuf-Java's lazy-parsing of strings, so the results may be slightly off. The benchmark code can be found in the `benchmarks` directory.
+We also ran benchmarks for reading and writing streams of delimited protobuf messages with varying contents, which is similar to reading sequentially from a log file. All datasets were loaded into memory and decoded from a byte array. This benchmark does not trigger lazy-parsing of strings, so it is primarily indicative of forwarding use cases. The benchmark code can be found in the `benchmarks` directory.
 
 |  | QuickBuffers<p>(Unsafe) | QuickBuffers<p>(without Unsafe) | Java`[1]`| JavaLite`[1]` | `[2]`
 | ----------- | -----------: | -----------: | -----------: | -----------: | ----------- |
 | **Read**  | | 
-| 1  | 173ms (502 MB/s) | 212ms (410 MB/s) |  344ms (253 MB/s)  | 567ms (153 MB/s) | 2.0
-| 2  | 102ms (559 MB/s)` | 118ms (483 MB/s) | 169ms (337 MB/s)  | 378ms (150 MB/s) | 1.7
-| 3  | 34ms (297 MB/s) | 44ms (226 MB/s) | 65ms (153 MB/s)  | 147ms (68 MB/s) | 1.9
-| 4  | 25ms (400 MB/s) | 28ms (353 MB/s) | 47ms (214 MB/s)  | 155ms (65 MB/s) | 1.9
-| 5 | 9.8ms (6.5 GB/s) | 44ms (1.5 GB/s) |  103ms (621 MB/s)  | 92ms (696 MB/s) | 10.5
+| 1  | 144ms (604 MB/s) | 149ms (584 MB/s) |  344ms (253 MB/s)  | 567ms (153 MB/s) | 2.4
+| 2  | 79ms (722 MB/s) | 90ms (633 MB/s) | 169ms (337 MB/s)  | 378ms (150 MB/s) | 2.1
+| 3  | 30ms (333 MB/s) | 35ms (286 MB/s) | 65ms (153 MB/s)  | 147ms (68 MB/s) | 2.2
+| 4  | 21ms (476 MB/s) | 21ms (476 MB/s) | 47ms (214 MB/s)  | 155ms (65 MB/s) | 2.2
+| 5 | 7ms (9.1 GB/s) | 29ms (2.2 GB/s) |  103ms (621 MB/s)  | 92ms (696 MB/s) | 14.7
 |  **Write**`[3]`  | | |
-| 1 | 118ms (737 MB/s)  | 165ms (527 MB/s) | 157ms (554 MB/s)  | 718ms (121 MB/s)  | 1.3
-| 2 | 71ms (802 MB/s)  | 101ms (564 MB/s) | 137ms (416 MB/s)  | 308ms (188 MB/s) | 1.9
-| 3  | 23ms (435 MB/s) | 29ms (344 MB/s) | 29ms (344 MB/s)  | 101ms (99 MB/s) | 1.3
-| 4  | 16ms (625 MB/s) | 23ms (434 MB/s) | 42ms (238 MB/s)  | 97ms (103 MB/s) | 2.6
-| 5 | 6.2ms (10 GB/s)  | 46ms (1.4 GB/s) | 16ms (4.0 GB/s)  | 21ms (3.0 GB/s) | 2.5
+| 1 | 99ms (879 MB/s)  | 155ms (561 MB/s) | 157ms (554 MB/s)  | 718ms (121 MB/s)  | 1.6
+| 2 | 58ms (983 MB/s)  | 79ms (722 MB/s) | 137ms (416 MB/s)  | 308ms (188 MB/s) | 2.4
+| 3  | 17ms (588 MB/s) | 21ms (476 MB/s) | 29ms (344 MB/s)  | 101ms (99 MB/s) | 1.7
+| 4  | 14ms (714 MB/s) | 17ms (588 MB/s) | 42ms (238 MB/s)  | 97ms (103 MB/s) | 3.0
+| 5 | 6.6ms (9.7 GB/s)  | 45ms (1.4 GB/s) | 16ms (4.0 GB/s)  | 21ms (3.0 GB/s) | 2.4
 | **Read + Write** |  | 
-| 1  | 291ms (299 MB/s) | 377ms (231 MB/s) | 501ms (174 MB/s)  | 1285 ms (68 MB/s) | 1.7
-| 2 | 173ms (329 MB/s) | 219ms (260 MB/s) | 306ms (186 MB/s)  | 686 ms (83 MB/s) | 1.8
-| 3  | 57ms (176 MB/s) | 73ms (138 MB/s) | 94ms (106 MB/s)  | 248ms (40 MB/s) | 1.6
-| 4  | 41ms (244 MB/s) | 51ms (196 MB/s) | 89ms (112 MB/s)  | 252ms (40 MB/s) | 2.2
-| 5  | 16ms (4.0 GB/s) | 90ms (711 MB/s) | 119ms (537 MB/s)  | 113ms (566 MB/s) | 7.4
+| 1  | 243ms (358 MB/s) | 304ms (286 MB/s) | 501ms (174 MB/s)  | 1285ms (68 MB/s) | 2.1
+| 2 | 137ms (416 MB/s) | 169ms (337 MB/s) | 306ms (186 MB/s)  | 686ms (83 MB/s) | 2.2
+| 3  | 47ms (213 MB/s) | 56ms (179 MB/s) | 94ms (106 MB/s)  | 248ms (40 MB/s) | 2.0
+| 4  | 35ms (286 MB/s) | 38ms (263 MB/s) | 89ms (112 MB/s)  | 252ms (40 MB/s) | 2.5
+| 5  | 14ms (4.7 GB/s) | 75ms (859 MB/s) | 119ms (537 MB/s)  | 113ms (566 MB/s) | 8.5
 
 <!-- | 3  | ms (  MB/s) | ms (  MB/s) | ms (  MB/s)  | ms (  MB/s) | 0 -->
 
@@ -74,22 +74,22 @@ We also compared QuickBuffers against the Java bindings of Google's [FlatBuffers
 |  | QuickBuffers | FlatBuffers (v1.11.0) | FlatBuffers (v1.10.0) | Ratio`[1]`
 | :----------- | :-----------: | :-----------: | :-----------: | :-----------: |
 | **UnsafeSource / DirectByteBuffer [ns/op]**  
-| Decode             | 292 | 0 | 0 |  0.0 
-| Traverse           | 17 | 234 | 321 |  13.8
-| Encode             | 312 | 457 | 649 |  1.5
-| Encode + Decode + Traverse | 621 | 691 | 970 |  1.1
+| Decode             | 177 | 0 | 0 |  0.0 
+| Traverse           | 125 | 234 | 321 |  1.9
+| Encode             | 233 | 457 | 649 |  2.0
+| Encode + Decode + Traverse | 523 | 691 | 970 |  1.3
 | **ArraySource / HeapByteBuffer [ns/op]**  
-| Decode             | 379 | 0 | 0 |  0.0  
-| Traverse           | 29 | 381 | 427 |  13.1
-| Encode             | 334 | 626 | 821 |  1.9
-| Encode + Decode + Traverse | 742 | 1007 | 1248 |  1.4
+| Decode             | 213 | 0 | 0 |  0.0  
+| Traverse           | 133 | 381 | 427 |  2.9
+| Encode             | 268 | 626 | 821 |  2.3
+| Encode + Decode + Traverse | 614 | 1007 | 1248 |  1.6
 | **Other**  
 | Serialized Size   | 228 bytes | 344 bytes | 344 bytes |  1.5
 | Transient memory allocated during decode   | 0 bytes | 0 bytes | 0 bytes | 1
 
 * `[1]` `FlatBuffers v1.11.0 / QuickBuffers`
-* `[2]` `Traverse = (Decode + Traverse) - Decode`
+* `[2]` `Traverse = (Decode + Traverse) - Decode` (includes lazy utf8 parsing)
 
 While the official C++ benchmark shows tremendous performance benefits over Protobuf, the Java implementation has unfortunately been lagging behind a bit. Recent versions have seen some significant performance improvements, but encoding and traversing a `ByteBuffer` still results in more overhead than may be expected.
 
-Also be aware that the benchmark was created with a bias for FlatBuffers. The original data is mostly comprised of large varint numbers (e.g. a 10 byte int64) and repeated messages with multiple levels of nesting, which is a particularly bad case for Protobuf. Messages with a flatter hierarchy and more fixed-size scalar types should fare much better.
+It is also worth noting that the benchmark was created with a bias for FlatBuffers. The original data consists mostly of large varint numbers (e.g. a 10-byte int64) and repeated messages with multiple levels of nesting, which is a particularly bad case for Protobuf. Messages with a flatter hierarchy and more fixed-size scalar types should fare much better.
@@ -48,6 +48,16 @@
             <artifactId>flatbuffers-java</artifactId>
             <version>1.11.0</version>
         </dependency>
+        <dependency>
+            <groupId>com.fasterxml.jackson.core</groupId>
+            <artifactId>jackson-core</artifactId>
+            <version>2.10.1</version>
+        </dependency>
+        <dependency>
+            <groupId>com.google.code.gson</groupId>
+            <artifactId>gson</artifactId>
+            <version>2.8.6</version>
+        </dependency>
     </dependencies>
 
     <build>
 
@@ -42,12 +42,12 @@
  *
  * === QuickBuffers (Unsafe) ===
  * Benchmark                              Mode  Cnt    Score    Error  Units
- * PackedDoublesBenchmark.readRobo        avgt   10    9.791 ±  0.331  ms/op -- 6.5 GB/s
- * PackedDoublesBenchmark.readWriteRobo   avgt   10   16.167 ±  0.726  ms/op --
+ * PackedDoublesBenchmark.readQuick       avgt   10   7.061 ± 0.167  ms/op
+ * PackedDoublesBenchmark.readWriteQuick  avgt   10  13.618 ± 0.337  ms/op
  *
  * === QuickBuffers (Safe) ===
- * PackedDoublesBenchmark.readRobo       avgt   10  44.434 ± 0.928  ms/op -- 1.5 GB/s
- * PackedDoublesBenchmark.readWriteRobo  avgt   10  89.855 ± 3.870  ms/op --
+ * PackedDoublesBenchmark.readQuick       avgt   10  29.202 ± 0.397  ms/op
+ * PackedDoublesBenchmark.readWriteQuick  avgt   10  74.527 ± 1.353  ms/op
  *
  * === Java (Some Unsafe) ===
  * PackedDoublesBenchmark.readProto       avgt   10  103.989 ± 37.389  ms/op
@@ -85,13 +85,13 @@ public static void main(String[] args) throws RunnerException {
     final Packed message = Packed.newInstance();
 
     @Benchmark
-    public Object readRobo() throws IOException {
+    public Object readQuick() throws IOException {
         source.wrap(input);
         return message.clear().mergeFrom(source);
     }
 
     @Benchmark
-    public int readWriteRobo() throws IOException {
+    public int readWriteQuick() throws IOException {
         message.clear().mergeFrom(source.wrap(input)).writeTo(sink.wrap(output));
         return sink.position();
     }
 
@@ -8,12 +8,12 @@
  * it under the terms of the GNU General Public License as
  * published by the Free Software Foundation, either version 3 of the
  * License, or (at your option) any later version.
- * 
+ *
  * This program is distributed in the hope that it will be useful,
  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  * GNU General Public License for more details.
- * 
+ *
  * You should have received a copy of the GNU General Public
  * License along with this program.  If not, see
  * <http://www.gnu.org/licenses/gpl-3.0.html>.
@@ -51,16 +51,16 @@
  *
  * === QuickBuffers (Unsafe) ===
  * Benchmark                                Mode  Cnt   Score    Error  Units
- * SbeBenchmark.carUnsafeRoboRead           avgt   10  33.602 ± 0.568  ms/op
- * SbeBenchmark.carUnsafeRoboReadReadWrite  avgt   10  56.860 ± 1.176  ms/op
- * SbeBenchmark.marketUnsafeRoboRead        avgt   10  25.022 ± 1.249  ms/op
- * SbeBenchmark.marketUnsafeRoboReadWrite   avgt   10  41.227 ± 0.612  ms/op
+ * SbeBenchmark.carUnsafeQuickRead           avgt   10  30.661 ± 2.892  ms/op
+ * SbeBenchmark.carUnsafeQuickReadReadWrite  avgt   10  47.498 ± 2.198  ms/op
+ * SbeBenchmark.marketUnsafeQuickRead        avgt   10  21.946 ± 0.997  ms/op
+ * SbeBenchmark.marketUnsafeQuickReadWrite   avgt   10  35.220 ± 1.000  ms/op
  *
  * === QuickBuffers (Safe) ===
- * SbeBenchmark.carRoboRead                    avgt   10   44.306 ±  1.814  ms/op -- 226 MB/s
- * SbeBenchmark.carRoboReadWrite               avgt   10   72.673 ±  3.227  ms/op -- 138 MB/s
- * SbeBenchmark.marketRoboRead                 avgt   10   28.309 ±  0.242  ms/op -- 353 MB/s
- * SbeBenchmark.marketRoboReadWrite            avgt   10   51.189 ±  0.979  ms/op -- 196 MB/s
+ * SbeBenchmark.carQuickRead          avgt   10  35.540 ± 2.008  ms/op
+ * SbeBenchmark.carQuickReadWrite     avgt   10  55.914 ± 3.173  ms/op
+ * SbeBenchmark.marketQuickRead       avgt   10  21.027 ± 0.871  ms/op
+ * SbeBenchmark.marketQuickReadWrite  avgt   10  38.426 ± 0.743  ms/op
  *
  * === Protobuf-Java
  * Benchmark                          Mode  Cnt   Score    Error  Units
@@ -129,44 +129,44 @@ private static byte[] multiplyToNumBytes(byte[] singleMessage, int maxNumBytes)
 
     // ===================== UNSAFE OPTION DISABLED (e.g. Android) =====================
     @Benchmark
-    public int marketRoboRead() throws IOException {
-        return readRobo(source.wrap(marketDataMessages), marketMsg);
+    public int marketQuickRead() throws IOException {
+        return readQuick(source.wrap(marketDataMessages), marketMsg);
     }
 
     @Benchmark
-    public int marketRoboReadWrite() throws IOException {
-        return readWriteRobo(source.wrap(marketDataMessages), marketMsg, sink.wrap(output));
+    public int marketQuickReadWrite() throws IOException {
+        return readWriteQuick(source.wrap(marketDataMessages), marketMsg, sink.wrap(output));
     }
 
     @Benchmark
-    public int carRoboRead() throws IOException {
-        return readRobo(source.wrap(carDataMessages), carMsg);
+    public int carQuickRead() throws IOException {
+        return readQuick(source.wrap(carDataMessages), carMsg);
     }
 
     @Benchmark
-    public int carRoboReadWrite() throws IOException {
-        return readWriteRobo(source.wrap(carDataMessages), carMsg, sink.wrap(output));
+    public int carQuickReadWrite() throws IOException {
+        return readWriteQuick(source.wrap(carDataMessages), carMsg, sink.wrap(output));
     }
 
     // ===================== UNSAFE OPTION ENABLED =====================
     @Benchmark
-    public int marketUnsafeRoboRead() throws IOException {
-        return readRobo(unsafeSource.wrap(marketDataMessages), marketMsg);
+    public int marketUnsafeQuickRead() throws IOException {
+        return readQuick(unsafeSource.wrap(marketDataMessages), marketMsg);
     }
 
     @Benchmark
-    public int marketUnsafeRoboReadWrite() throws IOException {
-        return readWriteRobo(unsafeSource.wrap(marketDataMessages), marketMsg, unsafeSink.wrap(output));
+    public int marketUnsafeQuickReadWrite() throws IOException {
+        return readWriteQuick(unsafeSource.wrap(marketDataMessages), marketMsg, unsafeSink.wrap(output));
     }
 
     @Benchmark
-    public int carUnsafeRoboRead() throws IOException {
-        return readRobo(unsafeSource.wrap(carDataMessages), carMsg);
+    public int carUnsafeQuickRead() throws IOException {
+        return readQuick(unsafeSource.wrap(carDataMessages), carMsg);
     }
 
     @Benchmark
-    public int carUnsafeRoboReadReadWrite() throws IOException {
-        return readWriteRobo(unsafeSource.wrap(carDataMessages), carMsg, unsafeSink.wrap(output));
+    public int carUnsafeQuickReadReadWrite() throws IOException {
+        return readWriteQuick(unsafeSource.wrap(carDataMessages), carMsg, unsafeSink.wrap(output));
     }
 
     // ===================== STOCK PROTOBUF =====================
@@ -191,7 +191,7 @@ public int carProtoReadWrite() throws IOException {
     }
 
     // ===================== UTIL METHODS =====================
-    static int readRobo(final ProtoSource source, final ProtoMessage message) throws IOException {
+    static int readQuick(final ProtoSource source, final ProtoMessage message) throws IOException {
         while (!source.isAtEnd()) {
             final int length = source.readRawVarint32();
             int limit = source.pushLimit(length);
@@ -201,17 +201,11 @@ static int readRobo(final ProtoSource source, final ProtoMessage message) throws
         return source.getPosition();
     }
 
-    static int readWriteRobo(final ProtoSource source, final ProtoMessage message, final ProtoSink sink) throws IOException {
+    static int readWriteQuick(final ProtoSource source, final ProtoMessage message, final ProtoSink sink) throws IOException {
         while (!source.isAtEnd()) {
-            // read delimited
-            final int length = source.readRawVarint32();
-            int limit = source.pushLimit(length);
-            message.clearQuick().mergeFrom(source);
-            source.popLimit(limit);
-
-            // write delimited
-            sink.writeRawVarint32(message.getSerializedSize());
-            message.writeTo(sink);
+            // read/write delimited
+            source.readMessage(message.clearQuick());
+            sink.writeMessageNoTag(message);
         }
         return sink.position();
     }