@@ -24,14 +24,6 @@ export interface TokenizerConfig {
2424 add_eos_token ?: boolean ;
2525 add_prefix_space ?: boolean ;
2626
27- // Padding and truncation
28- padding_side ?: "left" | "right" ;
29- truncation_side ?: "left" | "right" ;
30- model_max_length ?: number ;
31- max_length ?: number ;
32- stride ?: number ;
33- pad_to_multiple_of ?: number ;
34-
3527 // Cleaning and processing
3628 clean_up_tokenization_spaces ?: boolean ;
3729 split_special_tokens ?: boolean ;
@@ -74,8 +66,6 @@ export interface TokenConfig {
7466
7567export interface TokenizerJSON {
7668 version ?: string ;
77- truncation ?: TruncationConfig | null ;
78- padding ?: PaddingConfig | null ;
7969 added_tokens ?: AddedToken [ ] ;
8070 normalizer ?: TokenizerConfigNormalizer ;
8171 pre_tokenizer ?: TokenizerConfigPreTokenizer ;
@@ -84,29 +74,6 @@ export interface TokenizerJSON {
8474 model : TokenizerModelConfig ;
8575}
8676
87- // ----------------------------------------------------------------------------
88- // Truncation Configuration
89- // ----------------------------------------------------------------------------
90-
91- export interface TruncationConfig {
92- direction ?: "Left" | "Right" ;
93- max_length : number ;
94- strategy ?: "LongestFirst" | "OnlyFirst" | "OnlySecond" ;
95- stride ?: number ;
96- }
97-
98- // ----------------------------------------------------------------------------
99- // Padding Configuration
100- // ----------------------------------------------------------------------------
101-
102- export interface PaddingConfig {
103- direction ?: "Left" | "Right" ;
104- pad_id ?: number ;
105- pad_token ?: string ;
106- pad_type_id ?: number ;
107- pad_to_multiple_of ?: number | null ;
108- }
109-
11077// ----------------------------------------------------------------------------
11178// Added Tokens
11279// ----------------------------------------------------------------------------
0 commit comments