55import onnx_asr .utils
66from onnx_asr .adapters import TextResultsAsrAdapter
77
# Model names fed to the `model` fixture through
# `pytest.mark.parametrize("model", models, indirect=True)`; each entry is
# passed to `onnx_asr.load_model` as `request.param`.
8+ models = [
9+ "gigaam-v2-ctc" ,
10+ "gigaam-v2-rnnt" ,
11+ "nemo-fastconformer-ru-ctc" ,
12+ "nemo-fastconformer-ru-rnnt" ,
13+ "alphacep/vosk-model-ru" ,
14+ "alphacep/vosk-model-small-ru" ,
15+ "whisper-base" ,
16+ "onnx-community/whisper-tiny" ,
17+ ]
18+
819
@pytest.fixture(scope="module")
def model(request: pytest.FixtureRequest) -> TextResultsAsrAdapter:
    """Load the ASR model selected by the indirect parametrization value.

    ``request.param`` is the model name supplied by
    ``pytest.mark.parametrize("model", ..., indirect=True)``. The model is
    loaded with ``"uint8"`` quantization when the name is
    ``"onnx-community/whisper-tiny"`` and with ``"int8"`` for any other name.
    """
    model_name = request.param
    if model_name == "onnx-community/whisper-tiny":
        quantization = "uint8"
    else:
        quantization = "int8"
    return onnx_asr.load_model(model_name, quantization=quantization)
1223
1324
14- @pytest .mark .parametrize ("model" , [ "alphacep/vosk-model-small-ru" , "onnx-community/whisper-tiny" , "whisper-base" ] , indirect = True )
25+ @pytest .mark .parametrize ("model" , models , indirect = True )
1526def test_supported_only_mono_audio_error (model : TextResultsAsrAdapter ) -> None :
1627 rng = np .random .default_rng (0 )
1728 waveform = rng .random ((1 * 16_000 , 2 ), dtype = np .float32 )
@@ -20,7 +31,7 @@ def test_supported_only_mono_audio_error(model: TextResultsAsrAdapter) -> None:
2031 model .recognize (waveform )
2132
2233
23- @pytest .mark .parametrize ("model" , [ "alphacep/vosk-model-small-ru" , "onnx-community/whisper-tiny" , "whisper-base" ] , indirect = True )
34+ @pytest .mark .parametrize ("model" , models , indirect = True )
2435def test_wrong_sample_rate_error (model : TextResultsAsrAdapter ) -> None :
2536 rng = np .random .default_rng (0 )
2637 waveform = rng .random ((1 * 16_000 ), dtype = np .float32 )
@@ -29,7 +40,7 @@ def test_wrong_sample_rate_error(model: TextResultsAsrAdapter) -> None:
2940 model .recognize (waveform , sample_rate = 24_000 ) # type: ignore
3041
3142
32- @pytest .mark .parametrize ("model" , [ "alphacep/vosk-model-small-ru" , "onnx-community/whisper-tiny" , "whisper-base" ] , indirect = True )
43+ @pytest .mark .parametrize ("model" , models , indirect = True )
3344def test_recognize (model : TextResultsAsrAdapter ) -> None :
3445 rng = np .random .default_rng (0 )
3546 waveform = rng .random ((1 * 16_000 ), dtype = np .float32 )
0 commit comments