Skip to content

Commit 6f67640

Browse files
committed
Add typeTableLoader support.
Added - Add `async function typeTableLoader({registryEntryId})` option to look up the `typeTable` to use by id for both `encode` and `decode`. Changed - Refactor `registryEntryId` encoding and decoding logic. Trying to be more readable and handle more error and edge cases. This is a work in progress.
1 parent d512bcc commit 6f67640

File tree

4 files changed

+190
-52
lines changed

4 files changed

+190
-52
lines changed

CHANGELOG.md

+10
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,15 @@
11
# @digitalbazaar/cborld ChangeLog
22

3+
## 7.2.0 - 2024-10-xx
4+
5+
### Added
6+
- Add `async function typeTableLoader({registryEntryId})` option to look up the
7+
`typeTable` to use by id for both `encode` and `decode`.
8+
9+
### Changed
10+
- Refactor `registryEntryId` encoding and decoding logic. Trying to be more
11+
readable and handle more error and edge cases. This is a work in progress.
12+
313
## 7.1.3 - 2024-10-16
414

515
### Fixed

lib/decode.js

+65-16
Original file line numberDiff line numberDiff line change
@@ -7,6 +7,7 @@ import {CborldError} from './CborldError.js';
77
import {Converter} from './Converter.js';
88
import {Decompressor} from './Decompressor.js';
99
import {inspect} from './util.js';
10+
import {default as varint} from 'varint';
1011

1112
// 0xd9 == 11011001
1213
// 110 = CBOR major type 6
@@ -23,14 +24,16 @@ const CBORLD_TAG_SECOND_BYTE_LEGACY = 0x05;
2324
* @param {object} options - The options to use when decoding CBOR-LD.
2425
* @param {Uint8Array} options.cborldBytes - The encoded CBOR-LD bytes to
2526
* decode.
26-
* @param {Function} options.documentLoader -The document loader to use when
27+
* @param {Function} options.documentLoader - The document loader to use when
2728
* resolving JSON-LD Context URLs.
2829
* @param {diagnosticFunction} options.diagnose - A function that, if
2930
* provided, is called with diagnostic information.
30-
* @param {Map} options.typeTable - A map of possible value types, including
31+
* @param {Map} [options.typeTable] - A map of possible value types, including
3132
* `context`, `url`, `none`, and any JSON-LD type, each of which maps to
3233
* another map of values of that type to their associated CBOR-LD integer
3334
* values.
35+
* @param {Function} [options.typeTableLoader] - The typeTable loader to use to
36+
* resolve a registryEntryId to a typeTable.
3437
* @param {Map} options.appContextMap - A map of context string values
3538
* to their associated CBOR-LD integer values. For use with legacy
3639
* cborldBytes.
@@ -40,6 +43,7 @@ const CBORLD_TAG_SECOND_BYTE_LEGACY = 0x05;
4043
export async function decode({
4144
cborldBytes, documentLoader,
4245
typeTable,
46+
typeTableLoader,
4347
diagnose,
4448
appContextMap = new Map(),
4549
}) {
@@ -55,7 +59,7 @@ export async function decode({
5559
'ERR_NOT_CBORLD',
5660
'CBOR-LD must start with a CBOR major type "Tag" header of `0xd9`.');
5761
}
58-
const {suffix, isLegacy} = _getSuffix({cborldBytes});
62+
const {suffix, isLegacy, registryEntryId} = _getSuffix({cborldBytes});
5963
const isCompressed = _checkCompressionMode({cborldBytes, isLegacy});
6064
if(!isCompressed) {
6165
return cborg.decode(suffix, {useMaps: false});
@@ -68,6 +72,19 @@ export async function decode({
6872
diagnose(inspect(input, {depth: null, colors: true}));
6973
}
7074

75+
// lookup typeTable by id if needed
76+
if(!isLegacy) {
77+
if(!typeTable && typeTableLoader) {
78+
typeTable = await typeTableLoader({registryEntryId});
79+
}
80+
if(!typeTable) {
81+
throw new CborldError(
82+
'ERR_NO_TYPETABLE',
83+
'"typeTable" not provided or found for registryEntryId ' +
84+
`"${registryEntryId}".`);
85+
}
86+
}
87+
7188
const converter = _createConverter({
7289
isLegacy,
7390
typeTable,
@@ -126,27 +143,59 @@ function _checkCompressionMode({cborldBytes, isLegacy}) {
126143
}
127144

128145
function _getSuffix({cborldBytes}) {
129-
const isModern = cborldBytes[1] === CBORLD_TAG_SECOND_BYTE;
130-
const isLegacy = cborldBytes[1] === CBORLD_TAG_SECOND_BYTE_LEGACY;
146+
let index = 1; // start after 0xd9
147+
const isModern = cborldBytes[index] === CBORLD_TAG_SECOND_BYTE;
148+
const isLegacy = cborldBytes[index] === CBORLD_TAG_SECOND_BYTE_LEGACY;
131149
if(!(isModern || isLegacy)) {
132150
throw new CborldError(
133151
'ERR_NOT_CBORLD',
134152
'CBOR-LD must either have a second byte of 0x06 or 0x05 (legacy).');
135153
}
136154

137-
const tagValue = cborldBytes[2];
138-
let index = 3;
139-
if(isModern && tagValue >= 128) {
140-
// FIXME: this assumes tag length <= 31 bytes; throw error if not
141-
// cborldBytes[index + 1] is the header byte for the varint bytestring
142-
const varintArrayLength = cborldBytes[index + 1] % 32;
143-
// This sets `index` to the index of the first byte of the second
144-
// array element in `cborldBytes`
145-
index += varintArrayLength + 2;
146-
}
155+
index++; // advance to tag value
147156
const {buffer, byteOffset, length} = cborldBytes;
157+
const tagValue = cborldBytes[index];
158+
let registryEntryId;
159+
if(isModern) {
160+
if(tagValue < 128) {
161+
registryEntryId = tagValue;
162+
// advance to encoded data
163+
index++;
164+
} else {
165+
index++; // advance to array
166+
// check for 2 element array
167+
if(cborldBytes[index] !== 0x82) {
168+
throw new CborldError(
169+
'ERR_NOT_CBORLD',
170+
'CBOR-LD large varint encoding error.');
171+
}
172+
index++; // advance to byte string tag
173+
// first element is tail of varint encoded as byte string
174+
// low 5 bits are byte string length (or exceptions for large values)
175+
const varintArrayLength = cborldBytes[index] % 32;
176+
// don't support unbounded lengths here
177+
if(varintArrayLength >= 24) {
178+
throw new CborldError(
179+
'ERR_NOT_CBORLD',
180+
'CBOR-LD encoded registryEntryId too large.');
181+
}
182+
// FIXME: check for bad 0 length
183+
index++; // advance to byte string data
184+
// create single buffer for id varint initial byte and tail bytes
185+
const varintBytes = new Uint8Array(varintArrayLength + 1);
186+
varintBytes[0] = tagValue;
187+
const varintTailBytes = new Uint8Array(buffer, index, varintArrayLength);
188+
varintBytes.set(varintTailBytes, 1);
189+
// decode id from varint
190+
registryEntryId = varint.decode(varintBytes);
191+
// advance to second array element
192+
index += varintArrayLength;
193+
}
194+
} else {
195+
index++; // advance to tag value
196+
}
148197
const suffix = new Uint8Array(buffer, byteOffset + index, length - index);
149-
return {suffix, isLegacy};
198+
return {suffix, isLegacy, registryEntryId};
150199
}
151200

152201
/**

lib/encode.js

+39-32
Original file line numberDiff line numberDiff line change
@@ -30,10 +30,12 @@ const typeEncoders = {
3030
* @param {number|string} [options.registryEntryId='legacy] - The registry
3131
* entry ID for the registry entry associated with the resulting CBOR-LD
3232
* payload. For legacy support, use registryEntryId = 'legacy'.
33-
* @param {Map} options.typeTable - A map of possible value types, including
33+
* @param {Map} [options.typeTable] - A map of possible value types, including
3434
* `context`, `url`, `none`, and any JSON-LD type, each of which maps to
3535
* another map of values of that type to their associated CBOR-LD integer
3636
* values.
37+
* @param {Function} [options.typeTableLoader] - The typeTable loader to use to
38+
* resolve a registryEntryId to a typeTable.
3739
* @param {diagnosticFunction} options.diagnose - A function that, if
3840
* provided, is called with diagnostic information.
3941
* @param {Map} options.appContextMap - For use with the legacy value of
@@ -46,11 +48,11 @@ const typeEncoders = {
4648
export async function encode({
4749
jsonldDocument, documentLoader, registryEntryId = 'legacy',
4850
typeTable,
51+
typeTableLoader,
4952
diagnose,
5053
appContextMap,
5154
compressionMode
5255
} = {}) {
53-
5456
// validate that an acceptable value for `registryEntryId` was passed
5557
if(!((typeof registryEntryId === 'number' && registryEntryId > 0) ||
5658
registryEntryId === 'legacy')) {
@@ -96,6 +98,10 @@ export async function encode({
9698
// output uncompressed CBOR-LD
9799
suffix = cborg.encode(jsonldDocument);
98100
} else {
101+
// lookup typeTable by id if needed
102+
if(!isLegacy && !typeTable && typeTableLoader) {
103+
typeTable = await typeTableLoader({registryEntryId});
104+
}
99105
const converter = _createConverter({
100106
isLegacy,
101107
typeTable,
@@ -125,27 +131,34 @@ export async function encode({
125131
return bytes;
126132
}
127133

128-
/**
129-
* A diagnostic function that is called with diagnostic information. Typically
130-
* set to `console.log` when debugging.
131-
*
132-
* @callback diagnosticFunction
133-
* @param {string} message - The diagnostic message.
134-
*/
135-
136134
function _getPrefix({isLegacy, compressionMode, registryEntryId}) {
137135
if(isLegacy) {
138-
return new Uint8Array([0xd9, 0x05, compressionMode]);
136+
return new Uint8Array([
137+
0xd9, // CBOR major type 6 + 2 byte tag size
138+
0x05, // legacy CBOR-LD tag
139+
compressionMode // compression flag
140+
]);
139141
}
140-
const {
141-
varintTagValue, varintByteValue
142-
} = _getVarintStructure(registryEntryId);
143-
if(varintByteValue) {
144-
// Define varintByteValue as first element in 2 element array
145-
// `0x82` means "the following is a 2 element array"
146-
return [...varintTagValue, 0x82, ...varintByteValue];
142+
if(registryEntryId < 128) {
143+
return new Uint8Array([
144+
0xd9, // CBOR major type 6 + 2 byte tag size
145+
0x06, // non-legacy CBOR-LD tag
146+
registryEntryId // low-value type table id
147+
// encoded document appended in caller
148+
]);
147149
}
148-
return varintTagValue;
150+
const idVarint = varint.encode(registryEntryId);
151+
152+
return new Uint8Array([
153+
0xd9, // CBOR major type 6 + 2 byte tag size
154+
0x06, // non-legacy CBOR-LD tag
155+
idVarint[0],
156+
...[
157+
0x82, // 2 element array
158+
...cborg.encode(Uint8Array.from(idVarint.slice(1)))
159+
// encoded document appended as second element in caller
160+
]
161+
]);
149162
}
150163

151164
function _createConverter({
@@ -166,16 +179,10 @@ function _createConverter({
166179
});
167180
}
168181

169-
function _getVarintStructure(registryEntryId) {
170-
let varintTagValue;
171-
let varintByteValue;
172-
if(registryEntryId < 128) {
173-
varintTagValue = new Uint8Array([0xd9, 0x06, registryEntryId]);
174-
varintByteValue = null;
175-
} else {
176-
const varintArray = varint.encode(registryEntryId);
177-
varintTagValue = new Uint8Array([0xd9, 0x06, varintArray[0]]);
178-
varintByteValue = cborg.encode(Uint8Array.from(varintArray.slice(1)));
179-
}
180-
return {varintTagValue, varintByteValue};
181-
}
182+
/**
183+
* A diagnostic function that is called with diagnostic information. Typically
184+
* set to `console.log` when debugging.
185+
*
186+
* @callback diagnosticFunction
187+
* @param {string} message - The diagnostic message.
188+
*/

tests/decode.spec.js

+76-4
Original file line numberDiff line numberDiff line change
@@ -14,32 +14,104 @@ import {
1414
TYPE_TABLE,
1515
} from '../lib/tables.js';
1616

17+
function _makeTypeTableLoader(entries) {
18+
const typeTables = new Map(entries);
19+
return async function({registryEntryId}) {
20+
return typeTables.get(registryEntryId);
21+
};
22+
}
23+
1724
describe('cborld decode', () => {
25+
it('should decode CBOR-LD bytes (direct type table)',
26+
async () => {
27+
const cborldBytes = new Uint8Array([0xd9, 0x06, 0x01, 0xa0]);
28+
const jsonldDocument = await decode({
29+
cborldBytes,
30+
typeTable: new Map()
31+
});
32+
expect(jsonldDocument).deep.equal({});
33+
});
34+
35+
it('should decode CBOR-LD bytes (type table loader)',
36+
async () => {
37+
const cborldBytes = new Uint8Array([0xd9, 0x06, 0x01, 0xa0]);
38+
const jsonldDocument = await decode({
39+
cborldBytes,
40+
typeTableLoader: _makeTypeTableLoader([[0x01, new Map()]])
41+
});
42+
expect(jsonldDocument).deep.equal({});
43+
});
44+
45+
it('should fail to decode with no typeTable or typeTableLoader',
46+
async () => {
47+
const cborldBytes = new Uint8Array([0xd9, 0x06, 0x01, 0xa0]);
48+
let result;
49+
let error;
50+
try {
51+
result = await decode({
52+
cborldBytes
53+
});
54+
} catch(e) {
55+
error = e;
56+
}
57+
expect(result).to.eql(undefined);
58+
expect(error?.code).to.eql('ERR_NO_TYPETABLE');
59+
});
60+
61+
it('should fail to decode with no typeTableLoader id',
62+
async () => {
63+
const cborldBytes = new Uint8Array([0xd9, 0x06, 0x01, 0xa0]);
64+
let result;
65+
let error;
66+
try {
67+
result = await decode({
68+
cborldBytes,
69+
typeTableLoader: _makeTypeTableLoader([])
70+
});
71+
} catch(e) {
72+
error = e;
73+
}
74+
expect(result).to.eql(undefined);
75+
expect(error?.code).to.eql('ERR_NO_TYPETABLE');
76+
});
77+
1878
it('should decode empty document CBOR-LD bytes', async () => {
1979
const cborldBytes = new Uint8Array([0xd9, 0x06, 0x01, 0xa0]);
20-
const jsonldDocument = await decode({cborldBytes});
80+
const jsonldDocument = await decode({
81+
cborldBytes,
82+
typeTableLoader: _makeTypeTableLoader([[0x01, new Map()]])
83+
});
2184
expect(jsonldDocument).deep.equal({});
2285
});
2386

2487
it('should decode empty JSON-LD document bytes with varint', async () => {
2588
const cborldBytes = new Uint8Array([0xd9, 0x06, 0x10, 0xa0]);
26-
const jsonldDocument = await decode({cborldBytes});
89+
const jsonldDocument = await decode({
90+
cborldBytes,
91+
typeTableLoader: _makeTypeTableLoader([[0x10, new Map()]])
92+
});
2793
expect(jsonldDocument).deep.equal({});
2894
});
2995

3096
it('should decode empty JSON-LD document bytes with varint >1 byte',
3197
async () => {
3298
const cborldBytes = new Uint8Array(
3399
[0xd9, 0x06, 0x80, 0x82, 0x41, 0x01, 0xa0]);
34-
const jsonldDocument = await decode({cborldBytes});
100+
const jsonldDocument = await decode({
101+
cborldBytes,
102+
typeTableLoader: _makeTypeTableLoader([[0x80, new Map()]])
103+
});
35104
expect(jsonldDocument).deep.equal({});
36105
});
37106

38107
it('should decode an empty JSON-LD document with multiple byte varint',
39108
async () => {
40109
const cborldBytes = new Uint8Array(
41110
[0xd9, 0x06, 0x80, 0x82, 0x44, 0x94, 0xeb, 0xdc, 0x03, 0xa0]);
42-
const jsonldDocument = await decode({cborldBytes});
111+
const jsonldDocument = await decode({
112+
cborldBytes,
113+
typeTableLoader: _makeTypeTableLoader([[1000000000, new Map()]])
114+
});
43115
expect(jsonldDocument).deep.equal({});
44116
});
45117

0 commit comments

Comments
 (0)