|
5 | 5 | from lightning import LightningDataModule |
6 | 6 | from torch.utils.data import DataLoader |
7 | 7 | from transformers import Wav2Vec2FeatureExtractor, Wav2Vec2CTCTokenizer |
| 8 | + |
| 9 | +from vibravox.constants import LIST_OF_VIBRAVOX |
8 | 10 | from vibravox.torch_modules.dsp.data_augmentation import WaveformDataAugmentation |
9 | 11 |
|
10 | 12 |
|
11 | 13 | class STPLightningDataModule(LightningDataModule): |
12 | 14 |
|
13 | | - LIST_OF_VIBRAVOX = [ |
14 | | - "Cnam-LMSSC/vibravox", |
15 | | - "Cnam-LMSSC/vibravox2", |
16 | | - "Cnam-LMSSC/vibravox-test", |
17 | | - "Cnam-LMSSC/non_curated_vibravox", |
18 | | - "Cnam-LMSSC/vibravox_enhanced_by_EBEN", |
19 | | - ] |
20 | | - |
21 | 15 | def __init__( |
22 | 16 | self, |
23 | 17 | sample_rate: int = 16000, |
@@ -57,12 +51,12 @@ def __init__( |
57 | 51 | self.sample_rate = sample_rate |
58 | 52 | self.dataset_name_principal = dataset_name_principal |
59 | 53 | assert ( |
60 | | - dataset_name_principal in self.LIST_OF_VIBRAVOX |
| 54 | + dataset_name_principal in LIST_OF_VIBRAVOX |
61 | 55 | ), f"dataset_name_principal {dataset_name_principal} not supported." |
62 | 56 |
|
63 | 57 | self.dataset_name_secondary = dataset_name_secondary |
64 | 58 | assert ( |
65 | | - dataset_name_secondary is None or dataset_name_secondary in self.LIST_OF_VIBRAVOX |
| 59 | + dataset_name_secondary is None or dataset_name_secondary in LIST_OF_VIBRAVOX |
66 | 60 | ), f"dataset_name_secondary {dataset_name_secondary} not supported." |
67 | 61 | self.subset = subset |
68 | 62 | self.sensor = sensor |
|
0 commit comments