报错信息:
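语音识别阶段出错 [faster-whisper(本地)] 无效的值或参数:Could not load model G:/pyvideotrans-v3.92/models/whisper-large-v3-japanese-4k-steps-ct2 with any of the following classes: (<class 'transformers.models.auto.modeling_auto.AutoModelForCTC'>, <class 'transformers.models.auto.modeling_auto.AutoModelForSpeechSeq2Seq'>). See the original errors: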
while loading with AutoModelForCTC, an error is thrown:
Traceback (most recent call last):
File "transformers\pipelines\base.py", line 293, in infer_framework_load_model
model = model_class.from_pretrained(model, **kwargs)
File "transformers\models\auto\auto_factory.py", line 607, in from_pretrained
raise ValueError(
ValueError: Unrecognized configuration class for this kind of AutoModel: AutoModelForCTC.
Model type should be one of Data2VecAudioConfig, HubertConfig, MCTCTConfig, ParakeetCTCConfig, SEWConfig, SEWDConfig, UniSpeechConfig, UniSpeechSatConfig, Wav2Vec2Config, Wav2Vec2BertConfig, Wav2Vec2ConformerConfig, WavLMConfig.
During handling of the above exception, another exception occurred:
Traceback (most recent call last):
File "transformers\pipeline
......
g, WavLMConfig.
During handling of the above exception, another exception occurred:
Traceback (most recent call last):
File "transformers\pipelines\base.py", line 311, in infer_framework_load_model
model = model_class.from_pretrained(model, **fp32_kwargs)
File "transformers\models\auto\auto_factory.py", line 607, in from_pretrained
raise ValueError(
ValueError: Unrecognized configuration class for this kind of AutoModel: AutoModelForCTC.
Model type should be one of Data2VecAudioConfig, HubertConfig, MCTCTConfig, ParakeetCTCConfig, SEWConfig, SEWDConfig, UniSpeechConfig, UniSpeechSatConfig, Wav2Vec2Config, Wav2Vec2BertConfig, Wav2Vec2ConformerConfig, WavLMConfig.
while loading with AutoModelForSpeechSeq2Seq, an error is thrown:
Traceback (most recent call last):
File "transformers\pipelines\base.py", line 293, in infer_framework_load_model
model = model_class.from_pretrained(model, **kwargs)
File "transformers\models\auto\auto_factory.py", line 604, in from_pretrained
return model_class.from_pretrained(
File "transformers\modeling_utils.py", line 277, in _wrapper
return func(*args, **kwargs)
File "transformers\modeling_utils.py", line 4900, in from_pretrained
checkpoint_files, sharded_metadata = _get_resolved_checkpoint_files(
File "transformers\modeling_utils.py", line 989, in _get_resolved_checkpoint_files
raise OSError(
OSError: Error no file named pytorch_model.bin, model.safetensors, tf_model.h5, model.ckpt.index or flax_model.msgpack found in directory G:/pyvideotrans-v3.92/models/whisper-large-v3-japanese-4k-steps-ct2.
During handling of the above exception, another exception occurred:
Traceback (most recent call last):
File "transformers\pipelines\base.py", line 311, in infer_framework_load_model
model = model_class.from_pretrained(model, **fp32_kwargs)
File "transformers\models\auto\auto_factory.py", line 604, in from_pretrained
return model_class.from_pretrained(
File "transformers\modeling_utils.py", line 277, in _wrapper
return func(*args, **kwargs)
File "transformers\modeling_utils.py", line 4900, in from_pretrained
checkpoint_files, sharded_metadata = _get_resolved_checkpoint_files(
File "transformers\modeling_utils.py", line 989, in _get_resolved_checkpoint_files
raise OSError(
OSError: Error no file named pytorch_model.bin, model.safetensors, tf_model.h5, model.ckpt.index or flax_model.msgpack found in directory G:/pyvideotrans-v3.92/models/whisper-large-v3-japanese-4k-steps-ct2.
TaskCfg(cache_folder='G:/pyvideotrans-v3.92/tmp/18904/8efb566437', target_dir='D:/ffout/_video_out/0.序章-mp3', remove_noise=False, is_separate=False, detect_language='ja', subtitle_language=None, source_language='日语', target_language='-', source_language_code='ja', target_language_code=None, source_sub='D:/ffout/_video_out/0.序章-mp3/ja.srt', target_sub='D:/ffout/_video_out/0.序章-mp3/None.srt', source_wav='G:/pyvideotrans-v3.92/tmp/18904/8efb566437/ja.wav', source_wav_output='D:/ffout/_video_out/0.序章-mp3/ja.m4a', target_wav='G:/pyvideotrans-v3.92/tmp/18904/8efb566437/target.wav', target_wav_output='D:/ffout/_video_out/0.序章-mp3/None.m4a', subtitles='', novoice_mp4='G:/pyvideotrans-v3.92/tmp/18904/8efb566437/novoice.mp4', noextname='0.序章', shibie_audio=None, targetdir_mp4='D:/ffout/_video_out/0.序章-mp3/0.序章.mp4', instrument=None, vocal=None, back_audio='', background_music=None, app_mode='tiqu', subtitle_type=0, volume='+0%', pitch='+0Hz', voice_rate='+0%', voice_role='No', copysrt_rawvideo=False, clear_cache=False, translate_type=0, tts_type=0, recogn_type=0, model_name='JhonVanced/whisper-large-v3-japanese-4k-steps-ct2', split_type=0, voice_autorate=False, video_autorate=False, cuda=True, name='D:/ffout/0.序章.mp3', basename='0.序章.mp3', ext='mp3', dirname='D:/ffout', shound_del_name=None, uuid='8efb566437', remove_silent_mid=False, align_sub_audio=True, enable_diariz=False, nums_diariz=0, rephrase=0, only_out_mp4=False)




