TaskCfgVTT(is_cuda=True, uuid='af46875c30', cache_folder='E:/usr/Application/AI-Models/apps/pyvideotrans/tmp/28948/af46875c30', target_dir='G:/[Work-Space]/[Screen-Rec]/[Video-Cache]/_video_out/2026-05-03_23-09-27-mp4', source_language='英语', source_language_code='en', source_sub='G:/[Work-Space]/[Screen-Rec]/[Video-Cache]/_video_out/2026-05-03_23-09-27-mp4/en.srt', source_wav='E:/usr/Application/AI-Models/apps/pyvideotrans/tmp/28948/af46875c30/en.wav', source_wav_output='G:/[Work-Space]/[Screen-Rec]/[Video-Cache]/_video_out/2026-05-03_23-09-27-mp4/en.m4a', target_language='简体中文', target_language_code='zh-cn', target_sub='G:/[Work-Space]/[Screen-Rec]/[Video-Cache]/_video_out/2026-05-03_23-09-27-mp4/zh-cn.srt', target_wav='E:/usr/Application/AI-Models/apps/pyvideotrans/tmp/28948/af46875c30/target.wav', target_wav_output='G:/[Work-Space]/[Screen-Rec]/[Video-Cache]/_video_out/2026-05-03_23-09-27-mp4/zh-cn.m4a', name='G:/[Work-Space]/[Screen-Rec]/[Video-Cache]/2026-05-03_23-09-27.mp4', noextname='2026-05-03_23-09-27', basename='2026-05-03_23-09-27.mp4', ext='mp4', dirname='//Epa-00/30tb/[Work-Space]/[Screen-Rec]/[Video-Cache]', shound_del_name=None, translate_type=1, tts_type=0, volume='+0%', pitch='+0Hz', voice_rate='+0%', voice_role='No', voice_autorate=False, video_autorate=False, remove_silent_mid=False, align_sub_audio=True, detect_language='en', recogn_type=0, model_name='large-v3-turbo', shibie_audio=None, remove_noise=False, enable_diariz=False, nums_diariz=0, rephrase=0, fix_punc=True, subtitle_language=None, app_mode='tiqu', subtitles='', targetdir_mp4='G:/[Work-Space]/[Screen-Rec]/[Video-Cache]/_video_out/2026-05-03_23-09-27-mp4/2026-05-03_23-09-27.mp4', novoice_mp4='E:/usr/Application/AI-Models/apps/pyvideotrans/tmp/28948/af46875c30/novoice.mp4', is_separate=False, instrument=None, vocal=None, back_audio='', clear_cache=False, background_music=None, subtitle_type=0, only_out_mp4=False, recogn2pass=False, output_srt=1, copysrt_rawvideo=True)

语音识别阶段出错 [faster-whisper(本地)] Traceback (most recent call last):
File "E:\usr\Application\AI-Models\apps\pyvideotrans\videotrans\process\stt_fun.py", line 390, in faster_whisper

segments, info = batched_model.transcribe(
                 ^^^^^^^^^^^^^^^^^^^^^^^^^

File "E:\usr\Application\AI-Models\apps\pyvideotrans\venv\Lib\site-packages\faster_whisper\transcribe.py", line 515, in transcribe

np.stack([pad_or_trim(feature) for feature in features]) if features else []
          ^^^^^^^^^^^^^^^^^^^^

File "E:\usr\Application\AI-Models\apps\pyvideotrans\venv\Lib\site-packages\faster_whisper\audio.py", line 121, in pad_or_trim

array = np.pad(array, pad_widths)
        ^^^^^^^^^^^^^^^^^^^^^^^^^

File "E:\usr\Application\AI-Models\apps\pyvideotrans\venv\Lib\site-packages\numpy\lib\arraypad.py", line 798, in pad

padded, original_area_slice = _pad_simple(array, pad_width)
                              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^

File "E:\us
......
ideotrans\videotrans\recognition\_overall.py", line 105, in _faster

raws=self._new_process(callback=faster_whisper,title=title,is_cuda=self.is_cuda,kwargs=kwargs)
     ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^

File "E:\usr\Application\AI-Models\apps\pyvideotrans\videotrans\configure\_base.py", line 289, in _new_process

raise RuntimeError(err)

RuntimeError: Traceback (most recent call last):
File "E:\usr\Application\AI-Models\apps\pyvideotrans\videotrans\process\stt_fun.py", line 390, in faster_whisper

segments, info = batched_model.transcribe(
                 ^^^^^^^^^^^^^^^^^^^^^^^^^

File "E:\usr\Application\AI-Models\apps\pyvideotrans\venv\Lib\site-packages\faster_whisper\transcribe.py", line 515, in transcribe

np.stack([pad_or_trim(feature) for feature in features]) if features else []
          ^^^^^^^^^^^^^^^^^^^^

File "E:\usr\Application\AI-Models\apps\pyvideotrans\venv\Lib\site-packages\faster_whisper\audio.py", line 121, in pad_or_trim

array = np.pad(array, pad_widths)
        ^^^^^^^^^^^^^^^^^^^^^^^^^

File "E:\usr\Application\AI-Models\apps\pyvideotrans\venv\Lib\site-packages\numpy\lib\arraypad.py", line 798, in pad

padded, original_area_slice = _pad_simple(array, pad_width)
                              ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^

File "E:\usr\Application\AI-Models\apps\pyvideotrans\venv\Lib\site-packages\numpy\lib\arraypad.py", line 114, in _pad_simple

padded = np.empty(new_shape, dtype=array.dtype, order=order)
         ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^

numpy.core._exceptions._ArrayMemoryError: Unable to allocate 1.46 MiB for an array with shape (128, 3000) and data type float32
TaskCfgVTT(is_cuda=True, uuid='af46875c30', cache_folder='E:/usr/Application/AI-Models/apps/pyvideotrans/tmp/28948/af46875c30', target_dir='G:/[Work-Space]/[Screen-Rec]/[Video-Cache]/_video_out/2026-05-03_23-09-27-mp4', source_language='英语', source_language_code='en', source_sub='G:/[Work-Space]/[Screen-Rec]/[Video-Cache]/_video_out/2026-05-03_23-09-27-mp4/en.srt', source_wav='E:/usr/Application/AI-Models/apps/pyvideotrans/tmp/28948/af46875c30/en.wav', source_wav_output='G:/[Work-Space]/[Screen-Rec]/[Video-Cache]/_video_out/2026-05-03_23-09-27-mp4/en.m4a', target_language='简体中文', target_language_code='zh-cn', target_sub='G:/[Work-Space]/[Screen-Rec]/[Video-Cache]/_video_out/2026-05-03_23-09-27-mp4/zh-cn.srt', target_wav='E:/usr/Application/AI-Models/apps/pyvideotrans/tmp/28948/af46875c30/target.wav', target_wav_output='G:/[Work-Space]/[Screen-Rec]/[Video-Cache]/_video_out/2026-05-03_23-09-27-mp4/zh-cn.m4a', name='G:/[Work-Space]/[Screen-Rec]/[Video-Cache]/2026-05-03_23-09-27.mp4', noextname='2026-05-03_23-09-27', basename='2026-05-03_23-09-27.mp4', ext='mp4', dirname='//Epa-00/30tb/[Work-Space]/[Screen-Rec]/[Video-Cache]', shound_del_name=None, translate_type=1, tts_type=0, volume='+0%', pitch='+0Hz', voice_rate='+0%', voice_role='No', voice_autorate=False, video_autorate=False, remove_silent_mid=False, align_sub_audio=True, detect_language='en', recogn_type=0, model_name='large-v3-turbo', shibie_audio=None, remove_noise=False, enable_diariz=False, nums_diariz=0, rephrase=0, fix_punc=True, subtitle_language=None, app_mode='tiqu', subtitles='', targetdir_mp4='G:/[Work-Space]/[Screen-Rec]/[Video-Cache]/_video_out/2026-05-03_23-09-27-mp4/2026-05-03_23-09-27.mp4', novoice_mp4='E:/usr/Application/AI-Models/apps/pyvideotrans/tmp/28948/af46875c30/novoice.mp4', is_separate=False, instrument=None, vocal=None, back_audio='', clear_cache=False, background_music=None, subtitle_type=0, only_out_mp4=False, recogn2pass=False, output_srt=1, copysrt_rawvideo=True)

=
system:Windows-10-10.0.19045-SP0
version:v3.98
frozen:False
language:zh
root_dir:E:/usr/Application/AI-Models/apps/pyvideotrans
Python: 3.12.12 | packaged by Anaconda, Inc. | (main, Oct 21 2025, 20:05:38) [MSC v.1929 64 bit (AMD64)]

#4470 TaskCfgVTT(is_cuda=True, uuid='af46875c30', cache_folder='E:/usr/Application/AI-Models/apps/pyvideotrans/tmp/28948/af468

1 Replies

请查阅相关文档：

Post Your Reply

Related resource