#3793 TaskCfgVTT(is_cuda=True, uuid='db73c84643', cache_folder='D:/win-pyvideotrans-v3.98-317/tmp/21040/db73c84643', target_di

221.7* Posted at: 2 hours ago 👁7

语音识别阶段出错 [openai-whisper(本地)] Traceback (most recent call last):
File "videotrans\process\stt_fun.py", line 63, in openai_whisper
File "whisper\__init__.py", line 151, in load_model
File "torch\serialization.py", line 1516, in load

return _load(

File "torch\serialization.py", line 2114, in _load

result = unpickler.load()

File "torch\_weights_only_unpickler.py", line 532, in load

self.append(self.persistent_load(pid))

File "torch\serialization.py", line 2078, in persistent_load

typed_storage = load_tensor(

File "torch\serialization.py", line 2044, in load_tensor

wrap_storage = restore_location(storage, location)

File "torch\serialization.py", line 1854, in restore_location

return default_restore_location(storage, map_location)

File "torch\serialization.py", line 698, in default_restore_location

result = fn(storage, location)

File "torch\serialization.py", line 637, in _deserialize

return obj.to(device=device)

File "torch\storage.py", line 287, in to

return _to(self, device, non_blocking)

File "torch\_utils.py", line 102, in _to

untyped_storage.copy_(self, non_blocking)

RuntimeError: CUDA error: unknown error
Compile with TORCH_USE_CUDA_DSA to enable device-side assertions.

Traceback (most recent call last):
File "videotrans\task\job.py", line 105, in run
File "videotrans\task\trans_create.py", line 360, in recogn
File "videotrans\recognition\__init__.py", line 272, in run
File "videotrans\recognition\_base.py", line 143, in run
File "videotrans\recognition\_overall.py", line 31, in _exec
File "videotrans\recognition\_overall.py", line 73, in _openai
File "videotrans\configure\_base.py", line 289, in _new_process
RuntimeError: Traceback (most recent call last):
File "videotrans\process\stt_fun.py", line 63, in openai_whisper
File "whisper\__init__.py", line 151, in load_model
File "torch\serialization.py", line 1516, in load

return _load(

File "torch\serialization.py", line 2114, in _load

result = unpickler.load()

File "torch\_weights_only_unpickler.py", line 532, in load

self.append(self.persistent_load(pid))

File "torch\serialization.py", line 2078, in persistent_load

typed_storage = load_tensor(

File "torch\serialization.py", line 2044, in load_tensor

wrap_storage = restore_location(storage, location)

File "torch\serialization.py", line 1854, in restore_location

return default_restore_location(storage, map_location)

File "torch\serialization.py", line 698, in default_restore_location

result = fn(storage, location)

File "torch\serialization.py", line 637, in _deserialize

return obj.to(device=device)

File "torch\storage.py", line 287, in to

return _to(self, device, non_blocking)

File "torch\_utils.py", line 102, in _to

untyped_storage.copy_(self, non_blocking)

RuntimeError: CUDA error: unknown error
Compile with TORCH_USE_CUDA_DSA to enable device-side assertions.
TaskCfgVTT(is_cuda=True, uuid='db73c84643', cache_folder='D:/win-pyvideotrans-v3.98-317/tmp/21040/db73c84643', target_dir='D:/video/Dom scalp 合集/Jigsaw Trading/_video_out/0.1-mp4', source_language='英语', source_language_code='en', source_sub='D:/video/Dom scalp 合集/Jigsaw Trading/_video_out/0.1-mp4/en.srt', source_wav='D:/win-pyvideotrans-v3.98-317/tmp/21040/db73c84643/en.wav', source_wav_output='D:/video/Dom scalp 合集/Jigsaw Trading/_video_out/0.1-mp4/en.m4a', target_language='简体中文', target_language_code='zh-cn', target_sub='D:/video/Dom scalp 合集/Jigsaw Trading/_video_out/0.1-mp4/zh-cn.srt', target_wav='D:/win-pyvideotrans-v3.98-317/tmp/21040/db73c84643/target.wav', target_wav_output='D:/video/Dom scalp 合集/Jigsaw Trading/_video_out/0.1-mp4/zh-cn.m4a', name='D:/video/Dom scalp 合集/Jigsaw Trading/0.1.mp4', noextname='0.1', basename='0.1.mp4', ext='mp4', dirname='D:/video/Dom scalp 合集/Jigsaw Trading', shound_del_name=None, translate_type=0, tts_type=0, volume='+0%', pitch='+0Hz', voice_rate='+0%', voice_role='No', voice_autorate=False, video_autorate=True, remove_silent_mid=False, align_sub_audio=True, detect_language='en', recogn_type=1, model_name='large-v3-turbo', shibie_audio=None, remove_noise=False, enable_diariz=False, nums_diariz=0, rephrase=0, fix_punc=False, subtitle_language=None, app_mode='tiqu', subtitles='', targetdir_mp4='D:/video/Dom scalp 合集/Jigsaw Trading/_video_out/0.1-mp4/0.1.mp4', novoice_mp4='D:/win-pyvideotrans-v3.98-317/tmp/21040/db73c84643/novoice.mp4', is_separate=False, instrument=None, vocal=None, back_audio='', clear_cache=False, background_music=None, subtitle_type=0, only_out_mp4=False, recogn2pass=True, output_srt=2, copysrt_rawvideo=True)


=
system:Windows-10-10.0.26200-SP0
version:v3.98
frozen:True
language:zh
root_dir:D:/win-pyvideotrans-v3.98-317

1 Reply

这是由于 CUDA 环境配置问题或显卡驱动不兼容导致的。错误信息 RuntimeError: CUDA error: unknown error 表明软件在尝试使用 GPU 加载 openai-whisper 模型时,CUDA 调用失败。

解决方案:

  1. 检查 CUDA 版本:本软件内置支持 CUDA 12.8。请确认您已正确安装此版本。在 CMD 中输入 nvcc -V 查看版本。
  2. 更新显卡驱动:前往 NVIDIA 官网下载并安装最新版本的显卡驱动程序。
  3. 检查 cuDNN:确保已安装与 CUDA 12.8 匹配的 cuDNN(版本 9.11 及以上)。
  4. 临时解决方案:如果无法立即解决 CUDA 问题,可以暂时取消勾选主界面右上角的“CUDA加速”选项,软件将使用 CPU 进行语音识别(速度会慢很多)。
  5. 更换语音识别渠道:考虑使用 faster-whisper(本地) 渠道,它对 CUDA 环境的兼容性可能更好。或者,如果视频是中文发音,可以尝试 qwen-asr(本地) 渠道。

请查阅相关文档:

Post Your Reply
Maintaining a free, open-source project is not easy. If this project is helpful to you, please consider making a small donation to help keep it maintained and updated.

Related resources