Skip to content

Commit e161e9d

Browse files
committed
Special tokens included in the parameters
1 parent 5e6e30f commit e161e9d

File tree

2 files changed

+7
-2
lines changed

2 files changed

+7
-2
lines changed

midi_tokenizers/no_loss_tokenizer.py

Lines changed: 5 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -54,7 +54,11 @@ def __rich_repr__(self):
5454

5555
@property
5656
def parameters(self):
57-
return {"min_time_unit": self.min_time_unit, "n_velocity_bins": self.n_velocity_bins}
57+
return {
58+
"min_time_unit": self.min_time_unit,
59+
"n_velocity_bins": self.n_velocity_bins,
60+
"special_tokens": self.special_tokens,
61+
}
5862

5963
@property
6064
def vocab_size(self) -> int:

scripts/test_tokenizer.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -5,7 +5,6 @@
55
from fortepyan import MidiPiece
66
from datasets import load_dataset
77

8-
from midi_trainable_tokenizers import AwesomeMidiTokenizer
98
from midi_tokenizers.no_loss_tokenizer import ExponentialTimeTokenizer
109

1110

@@ -91,6 +90,8 @@ def main():
9190
print(f"MidiPieces loaded in {loading_time:.2f} seconds")
9291

9392
tokenizer = ExponentialTimeTokenizer(min_time_unit=0.01, n_velocity_bins=32)
93+
tokenizer_desc = tokenizer.to_dict()
94+
tokenizer = ExponentialTimeTokenizer.from_dict(tokenizer_desc=tokenizer_desc)
9495
# tokenizer = AwesomeMidiTokenizer.from_file("dumps/awesome_tokenizers/awesome-tokenizer-test-2024-06-11_17-11-44.json")
9596

9697
print("\nRunning speed and accuracy test for ExponentialTimeTokenizer on validation split")

0 commit comments

Comments
 (0)