@@ -40,30 +40,31 @@ def test_pretraining_models(bundle):
4040
4141
4242@pytest .mark .parametrize (
43- "bundle,expected" ,
43+ "bundle,lang, expected" ,
4444 [
45- (WAV2VEC2_ASR_BASE_10M , 'I|HAD|THAT|CURIYOSSITY|BESID|ME|AT|THIS|MOMENT|' ),
46- (WAV2VEC2_ASR_BASE_100H , 'I|HAD|THAT|CURIOSITY|BESIDE|ME|AT|THIS|MOMENT|' ),
47- (WAV2VEC2_ASR_BASE_960H , 'I|HAD|THAT|CURIOSITY|BESIDE|ME|AT|THIS|MOMENT|' ),
48- (WAV2VEC2_ASR_LARGE_10M , 'I|HAD|THAT|CURIOUSITY|BESIDE|ME|AT|THIS|MOMENT|' ),
49- (WAV2VEC2_ASR_LARGE_100H , 'I|HAD|THAT|CURIOSITY|BESIDE|ME|AT|THIS|MOMENT|' ),
50- (WAV2VEC2_ASR_LARGE_960H , 'I|HAD|THAT|CURIOSITY|BESIDE|ME|AT|THIS|MOMENT|' ),
51- (WAV2VEC2_ASR_LARGE_LV60K_10M , 'I|HAD|THAT|CURIOUSSITY|BESID|ME|AT|THISS|MOMENT|' ),
52- (WAV2VEC2_ASR_LARGE_LV60K_100H , 'I|HAVE|THAT|CURIOSITY|BESIDE|ME|AT|THIS|MOMENT|' ),
53- (WAV2VEC2_ASR_LARGE_LV60K_960H , 'I|HAVE|THAT|CURIOSITY|BESIDE|ME|AT|THIS|MOMENT|' ),
54- (HUBERT_ASR_LARGE , 'I|HAVE|THAT|CURIOSITY|BESIDE|ME|AT|THIS|MOMENT|' ),
55- (HUBERT_ASR_XLARGE , 'I|HAVE|THAT|CURIOSITY|BESIDE|ME|AT|THIS|MOMENT|' )
45+ (WAV2VEC2_ASR_BASE_10M , 'en' , ' I|HAD|THAT|CURIYOSSITY|BESID|ME|AT|THIS|MOMENT|' ),
46+ (WAV2VEC2_ASR_BASE_100H , 'en' , ' I|HAD|THAT|CURIOSITY|BESIDE|ME|AT|THIS|MOMENT|' ),
47+ (WAV2VEC2_ASR_BASE_960H , 'en' , ' I|HAD|THAT|CURIOSITY|BESIDE|ME|AT|THIS|MOMENT|' ),
48+ (WAV2VEC2_ASR_LARGE_10M , 'en' , ' I|HAD|THAT|CURIOUSITY|BESIDE|ME|AT|THIS|MOMENT|' ),
49+ (WAV2VEC2_ASR_LARGE_100H , 'en' , ' I|HAD|THAT|CURIOSITY|BESIDE|ME|AT|THIS|MOMENT|' ),
50+ (WAV2VEC2_ASR_LARGE_960H , 'en' , ' I|HAD|THAT|CURIOSITY|BESIDE|ME|AT|THIS|MOMENT|' ),
51+ (WAV2VEC2_ASR_LARGE_LV60K_10M , 'en' , ' I|HAD|THAT|CURIOUSSITY|BESID|ME|AT|THISS|MOMENT|' ),
52+ (WAV2VEC2_ASR_LARGE_LV60K_100H , 'en' , ' I|HAVE|THAT|CURIOSITY|BESIDE|ME|AT|THIS|MOMENT|' ),
53+ (WAV2VEC2_ASR_LARGE_LV60K_960H , 'en' , ' I|HAVE|THAT|CURIOSITY|BESIDE|ME|AT|THIS|MOMENT|' ),
54+ (HUBERT_ASR_LARGE , 'en' , ' I|HAVE|THAT|CURIOSITY|BESIDE|ME|AT|THIS|MOMENT|' ),
55+ (HUBERT_ASR_XLARGE , 'en' , ' I|HAVE|THAT|CURIOSITY|BESIDE|ME|AT|THIS|MOMENT|' ),
5656 ]
5757)
5858def test_finetune_asr_model (
5959 bundle ,
60+ lang ,
6061 expected ,
61- sample_speech_16000_en ,
62+ sample_speech ,
6263 ctc_decoder ,
6364):
6465 """Smoke test of downloading weights for fine-tuning models and simple transcription"""
6566 model = bundle .get_model ().eval ()
66- waveform , sample_rate = torchaudio .load (sample_speech_16000_en )
67+ waveform , sample_rate = torchaudio .load (sample_speech )
6768 emission , _ = model (waveform )
6869 decoder = ctc_decoder (bundle .get_labels ())
6970 result = decoder (emission [0 ])
0 commit comments