@@ -7,6 +7,7 @@ import {CborldError} from './CborldError.js';
7
7
import { Converter } from './Converter.js' ;
8
8
import { Decompressor } from './Decompressor.js' ;
9
9
import { inspect } from './util.js' ;
10
+ import { default as varint } from 'varint' ;
10
11
11
12
// 0xd9 == 11011001
12
13
// 110 = CBOR major type 6
@@ -23,14 +24,16 @@ const CBORLD_TAG_SECOND_BYTE_LEGACY = 0x05;
23
24
* @param {object } options - The options to use when decoding CBOR-LD.
24
25
* @param {Uint8Array } options.cborldBytes - The encoded CBOR-LD bytes to
25
26
* decode.
26
- * @param {Function } options.documentLoader -The document loader to use when
27
+ * @param {Function } options.documentLoader - The document loader to use when
27
28
* resolving JSON-LD Context URLs.
28
29
* @param {diagnosticFunction } options.diagnose - A function that, if
29
30
* provided, is called with diagnostic information.
30
- * @param {Map } options.typeTable - A map of possible value types, including
31
+ * @param {Map } [ options.typeTable] - A map of possible value types, including
31
32
* `context`, `url`, `none`, and any JSON-LD type, each of which maps to
32
33
* another map of values of that type to their associated CBOR-LD integer
33
34
* values.
35
+ * @param {Function } [options.typeTableLoader] - The typeTable loader to use to
36
+ * resolve a registryEntryId to a typeTable.
34
37
* @param {Map } options.appContextMap - A map of context string values
35
38
* to their associated CBOR-LD integer values. For use with legacy
36
39
* cborldBytes.
@@ -40,6 +43,7 @@ const CBORLD_TAG_SECOND_BYTE_LEGACY = 0x05;
40
43
export async function decode ( {
41
44
cborldBytes, documentLoader,
42
45
typeTable,
46
+ typeTableLoader,
43
47
diagnose,
44
48
appContextMap = new Map ( ) ,
45
49
} ) {
@@ -55,7 +59,7 @@ export async function decode({
55
59
'ERR_NOT_CBORLD' ,
56
60
'CBOR-LD must start with a CBOR major type "Tag" header of `0xd9`.' ) ;
57
61
}
58
- const { suffix, isLegacy} = _getSuffix ( { cborldBytes} ) ;
62
+ const { suffix, isLegacy, registryEntryId } = _getSuffix ( { cborldBytes} ) ;
59
63
const isCompressed = _checkCompressionMode ( { cborldBytes, isLegacy} ) ;
60
64
if ( ! isCompressed ) {
61
65
return cborg . decode ( suffix , { useMaps : false } ) ;
@@ -68,6 +72,19 @@ export async function decode({
68
72
diagnose ( inspect ( input , { depth : null , colors : true } ) ) ;
69
73
}
70
74
75
+ // lookup typeTable by id if needed
76
+ if ( ! isLegacy ) {
77
+ if ( ! typeTable && typeTableLoader ) {
78
+ typeTable = await typeTableLoader ( { registryEntryId} ) ;
79
+ }
80
+ if ( ! typeTable ) {
81
+ throw new CborldError (
82
+ 'ERR_NO_TYPETABLE' ,
83
+ '"typeTable" not provided or found for registryEntryId ' +
84
+ `"${ registryEntryId } ".` ) ;
85
+ }
86
+ }
87
+
71
88
const converter = _createConverter ( {
72
89
isLegacy,
73
90
typeTable,
@@ -126,27 +143,59 @@ function _checkCompressionMode({cborldBytes, isLegacy}) {
126
143
}
127
144
128
145
function _getSuffix ( { cborldBytes} ) {
129
- const isModern = cborldBytes [ 1 ] === CBORLD_TAG_SECOND_BYTE ;
130
- const isLegacy = cborldBytes [ 1 ] === CBORLD_TAG_SECOND_BYTE_LEGACY ;
146
+ let index = 1 ; // start after 0xd9
147
+ const isModern = cborldBytes [ index ] === CBORLD_TAG_SECOND_BYTE ;
148
+ const isLegacy = cborldBytes [ index ] === CBORLD_TAG_SECOND_BYTE_LEGACY ;
131
149
if ( ! ( isModern || isLegacy ) ) {
132
150
throw new CborldError (
133
151
'ERR_NOT_CBORLD' ,
134
152
'CBOR-LD must either have a second byte of 0x06 or 0x05 (legacy).' ) ;
135
153
}
136
154
137
- const tagValue = cborldBytes [ 2 ] ;
138
- let index = 3 ;
139
- if ( isModern && tagValue >= 128 ) {
140
- // FIXME: this assumes tag length <= 31 bytes; throw error if not
141
- // cborldBytes[index + 1] is the header byte for the varint bytestring
142
- const varintArrayLength = cborldBytes [ index + 1 ] % 32 ;
143
- // This sets `index` to the index of the first byte of the second
144
- // array element in `cborldBytes`
145
- index += varintArrayLength + 2 ;
146
- }
155
+ index ++ ; // advance to tag value
147
156
const { buffer, byteOffset, length} = cborldBytes ;
157
+ const tagValue = cborldBytes [ index ] ;
158
+ let registryEntryId ;
159
+ if ( isModern ) {
160
+ if ( tagValue < 128 ) {
161
+ registryEntryId = tagValue ;
162
+ // advance to encoded data
163
+ index ++ ;
164
+ } else {
165
+ index ++ ; // advance to array
166
+ // check for 2 element array
167
+ if ( cborldBytes [ index ] !== 0x82 ) {
168
+ throw new CborldError (
169
+ 'ERR_NOT_CBORLD' ,
170
+ 'CBOR-LD large varint encoding error.' ) ;
171
+ }
172
+ index ++ ; // advance to byte string tag
173
+ // first element is tail of varint encoded as byte string
174
+ // low 5 bits are byte string length (or exceptions for large values)
175
+ const varintArrayLength = cborldBytes [ index ] % 32 ;
176
+ // don't support unbounded lengths here
177
+ if ( varintArrayLength >= 24 ) {
178
+ throw new CborldError (
179
+ 'ERR_NOT_CBORLD' ,
180
+ 'CBOR-LD encoded registryEntryId too large.' ) ;
181
+ }
182
+ // FIXME: check for bad 0 length
183
+ index ++ ; // advance to byte string data
184
+ // create single buffer for id varint initial byte and tail bytes
185
+ const varintBytes = new Uint8Array ( varintArrayLength + 1 ) ;
186
+ varintBytes [ 0 ] = tagValue ;
187
+ const varintTailBytes = new Uint8Array ( buffer , index , varintArrayLength ) ;
188
+ varintBytes . set ( varintTailBytes , 1 ) ;
189
+ // decode id from varint
190
+ registryEntryId = varint . decode ( varintBytes ) ;
191
+ // advance to second array element
192
+ index += varintArrayLength ;
193
+ }
194
+ } else {
195
+ index ++ ; // advance to tag value
196
+ }
148
197
const suffix = new Uint8Array ( buffer , byteOffset + index , length - index ) ;
149
- return { suffix, isLegacy} ;
198
+ return { suffix, isLegacy, registryEntryId } ;
150
199
}
151
200
152
201
/**
0 commit comments