Refactor: Extract shared constants, populate __init__.py, fix Python version constraint (jhauret#63)

jhauret · web-flow · commit 452276aefa9b · 2025-11-29T23:51:55.000+11:00
diff --git a/pyproject.toml b/pyproject.toml
@@ -4,7 +4,7 @@ version = "0.1.1"
 description = "Speech to Phoneme, Bandwidth Extension and Speaker Verification using the Vibravox dataset."
 authors = [{ name = "Julien Hauret", email = "j.hauret.33@gmail.com" }]
 readme = "README.md"
-requires-python = "==3.12.0"
+requires-python = ">=3.12.0"
 dependencies = [
     "moshi==0.2.4",
     "isort",
diff --git a/vibravox/__init__.py b/vibravox/__init__.py
@@ -0,0 +1,8 @@
+"""Vibravox: Speech to Phoneme, Bandwidth Extension and Speaker Verification using the Vibravox dataset."""
+
+from vibravox.constants import LIST_OF_VIBRAVOX, AVAILABLE_SENSORS
+
+__all__ = [
+    "LIST_OF_VIBRAVOX",
+    "AVAILABLE_SENSORS",
+]
diff --git a/vibravox/constants.py b/vibravox/constants.py
@@ -0,0 +1,20 @@
+"""Constants used throughout the vibravox package."""
+
+# Dataset names accepted as dataset_name_principal / dataset_name_secondary by the datamodules
+LIST_OF_VIBRAVOX = [
+    "Cnam-LMSSC/vibravox",
+    "Cnam-LMSSC/vibravox2",
+    "Cnam-LMSSC/vibravox-test",
+    "Cnam-LMSSC/non_curated_vibravox",
+    "Cnam-LMSSC/vibravox_enhanced_by_EBEN",
+]
+
+# List of available sensors
+AVAILABLE_SENSORS = [
+    "headset_microphone",
+    "throat_microphone",
+    "forehead_accelerometer",
+    "rigid_in_ear_microphone",
+    "soft_in_ear_microphone",
+    "temple_vibration_pickup",
+]
diff --git a/vibravox/datasets/__init__.py b/vibravox/datasets/__init__.py
@@ -0,0 +1,7 @@
+"""Dataset utilities for the Vibravox package."""
+
+from vibravox.datasets.speech_noise import SpeechNoiseDataset
+
+__all__ = [
+    "SpeechNoiseDataset",
+]
diff --git a/vibravox/lightning_datamodules/__init__.py b/vibravox/lightning_datamodules/__init__.py
@@ -0,0 +1,13 @@
+"""Lightning DataModules for the Vibravox package."""
+
+from vibravox.lightning_datamodules.bwe import BWELightningDataModule
+from vibravox.lightning_datamodules.noisybwe import NoisyBWELightningDataModule
+from vibravox.lightning_datamodules.spkv import SPKVLightningDataModule
+from vibravox.lightning_datamodules.stp import STPLightningDataModule
+
+__all__ = [
+    "BWELightningDataModule",
+    "NoisyBWELightningDataModule",
+    "SPKVLightningDataModule",
+    "STPLightningDataModule",
+]
diff --git a/vibravox/lightning_datamodules/bwe.py b/vibravox/lightning_datamodules/bwe.py
@@ -7,20 +7,13 @@
 from torch.nn.utils.rnn import pad_sequence
 from torch.utils.data import DataLoader
 
+from vibravox.constants import LIST_OF_VIBRAVOX
 from vibravox.torch_modules.dsp.data_augmentation import WaveformDataAugmentation
 from vibravox.utils import set_audio_duration
 
 
 class BWELightningDataModule(LightningDataModule):
 
-    LIST_OF_VIBRAVOX = [
-        "Cnam-LMSSC/vibravox",
-        "Cnam-LMSSC/vibravox2",
-        "Cnam-LMSSC/vibravox-test",
-        "Cnam-LMSSC/non_curated_vibravox",
-        "Cnam-LMSSC/vibravox_enhanced_by_EBEN",
-    ]
-
     def __init__(
         self,
         sample_rate: int = 16000,
@@ -63,12 +56,12 @@ def __init__(
 
         self.dataset_name_principal = dataset_name_principal
         assert (
-            dataset_name_principal in self.LIST_OF_VIBRAVOX
+            dataset_name_principal in LIST_OF_VIBRAVOX
         ), f"dataset_name_principal {dataset_name_principal} not supported."
 
         self.dataset_name_secondary = dataset_name_secondary
         assert (
-            dataset_name_secondary is None or dataset_name_secondary in self.LIST_OF_VIBRAVOX
+            dataset_name_secondary is None or dataset_name_secondary in LIST_OF_VIBRAVOX
         ), f"dataset_name_secondary {dataset_name_secondary} not supported."
 
         self.subset = subset
diff --git a/vibravox/lightning_datamodules/noisybwe.py b/vibravox/lightning_datamodules/noisybwe.py
@@ -5,7 +5,6 @@
 from datasets import Audio, load_dataset
 from torch.nn.utils.rnn import pad_sequence
 from torch.utils.data import DataLoader
-from lightning import LightningDataModule
 from vibravox.utils import mix_speech_and_noise_without_rescaling
 from vibravox.utils import set_audio_duration
 from vibravox.torch_modules.dsp.data_augmentation import WaveformDataAugmentation
diff --git a/vibravox/lightning_datamodules/stp.py b/vibravox/lightning_datamodules/stp.py
@@ -5,19 +5,13 @@
 from lightning import LightningDataModule
 from torch.utils.data import DataLoader
 from transformers import Wav2Vec2FeatureExtractor, Wav2Vec2CTCTokenizer
+
+from vibravox.constants import LIST_OF_VIBRAVOX
 from vibravox.torch_modules.dsp.data_augmentation import WaveformDataAugmentation
 
 
 class STPLightningDataModule(LightningDataModule):
 
-    LIST_OF_VIBRAVOX = [
-        "Cnam-LMSSC/vibravox",
-        "Cnam-LMSSC/vibravox2",
-        "Cnam-LMSSC/vibravox-test",
-        "Cnam-LMSSC/non_curated_vibravox",
-        "Cnam-LMSSC/vibravox_enhanced_by_EBEN",
-    ]
-
     def __init__(
         self,
         sample_rate: int = 16000,
@@ -57,12 +51,12 @@ def __init__(
         self.sample_rate = sample_rate
         self.dataset_name_principal = dataset_name_principal
         assert (
-            dataset_name_principal in self.LIST_OF_VIBRAVOX
+            dataset_name_principal in LIST_OF_VIBRAVOX
         ), f"dataset_name_principal {dataset_name_principal} not supported."
 
         self.dataset_name_secondary = dataset_name_secondary
         assert (
-            dataset_name_secondary is None or dataset_name_secondary in self.LIST_OF_VIBRAVOX
+            dataset_name_secondary is None or dataset_name_secondary in LIST_OF_VIBRAVOX
         ), f"dataset_name_secondary {dataset_name_secondary} not supported."
         self.subset = subset
         self.sensor = sensor
diff --git a/vibravox/lightning_modules/__init__.py b/vibravox/lightning_modules/__init__.py
@@ -0,0 +1,15 @@
+"""Lightning Modules for the Vibravox package."""
+
+from vibravox.lightning_modules.base_se import BaseSELightningModule
+from vibravox.lightning_modules.eben import EBENLightningModule
+from vibravox.lightning_modules.ecapa2 import ECAPA2LightningModule
+from vibravox.lightning_modules.regressive_mimi import RegressiveMimiLightningModule
+from vibravox.lightning_modules.wav2vec2_for_stp import Wav2Vec2ForSTPLightningModule
+
+__all__ = [
+    "BaseSELightningModule",
+    "EBENLightningModule",
+    "ECAPA2LightningModule",
+    "RegressiveMimiLightningModule",
+    "Wav2Vec2ForSTPLightningModule",
+]
diff --git a/vibravox/metrics/__init__.py b/vibravox/metrics/__init__.py
@@ -0,0 +1,15 @@
+"""Metrics for the Vibravox package."""
+
+from vibravox.metrics.embedding_distance import BinaryEmbeddingDistance
+from vibravox.metrics.equal_error_rate import EqualErrorRate
+from vibravox.metrics.minimum_dcf import MinimumDetectionCostFunction
+from vibravox.metrics.noresqa_mos import NoresqaMOS
+from vibravox.metrics.torchsquim_stoi import TorchsquimSTOI
+
+__all__ = [
+    "BinaryEmbeddingDistance",
+    "EqualErrorRate",
+    "MinimumDetectionCostFunction",
+    "NoresqaMOS",
+    "TorchsquimSTOI",
+]
diff --git a/vibravox/torch_modules/__init__.py b/vibravox/torch_modules/__init__.py
@@ -0,0 +1,9 @@
+"""PyTorch modules for the Vibravox package."""
+
+from vibravox.torch_modules import dnn, dsp, losses
+
+__all__ = [
+    "dnn",
+    "dsp",
+    "losses",
+]
diff --git a/vibravox/torch_modules/dnn/__init__.py b/vibravox/torch_modules/dnn/__init__.py
@@ -0,0 +1,19 @@
+"""Deep Neural Network modules for the Vibravox package."""
+
+from vibravox.torch_modules.dnn.eben_discriminator import (
+    DiscriminatorEBENMultiScales,
+    DiscriminatorEBEN,
+)
+from vibravox.torch_modules.dnn.eben_generator import EBENGenerator
+from vibravox.torch_modules.dnn.melgan_discriminator import (
+    MelganMultiScalesDiscriminator,
+    DiscriminatorMelGAN,
+)
+
+__all__ = [
+    "DiscriminatorEBENMultiScales",
+    "DiscriminatorEBEN",
+    "EBENGenerator",
+    "MelganMultiScalesDiscriminator",
+    "DiscriminatorMelGAN",
+]
diff --git a/vibravox/torch_modules/dsp/__init__.py b/vibravox/torch_modules/dsp/__init__.py
@@ -0,0 +1,11 @@
+"""Digital Signal Processing modules for the Vibravox package."""
+
+from vibravox.torch_modules.dsp.data_augmentation import WaveformDataAugmentation
+from vibravox.torch_modules.dsp.pqmf import PseudoQMFBanks
+from vibravox.torch_modules.dsp.time_masking_waveform import TimeMaskingBlockWaveform
+
+__all__ = [
+    "WaveformDataAugmentation",
+    "PseudoQMFBanks",
+    "TimeMaskingBlockWaveform",
+]
diff --git a/vibravox/torch_modules/losses/__init__.py b/vibravox/torch_modules/losses/__init__.py
@@ -0,0 +1,9 @@
+"""Loss functions for the Vibravox package."""
+
+from vibravox.torch_modules.losses.feature_loss import FeatureLossForDiscriminatorMelganMultiScales
+from vibravox.torch_modules.losses.hinge_loss import HingeLossForDiscriminatorMelganMultiScales
+
+__all__ = [
+    "FeatureLossForDiscriminatorMelganMultiScales",
+    "HingeLossForDiscriminatorMelganMultiScales",
+]