#5278 TaskCfgVTT(uuid='d87b1dd66e', name='D:/win-pyvideotrans-v4.02-0616/myVideo/test.mp4', dirname='D:/win-pyvideotrans-v4.02

95.40* Posted at: 2 days ago

Batch size mismatch: audio=8, context=0:Traceback (most recent call last):
File "videotrans\process\stt_fun.py", line 559, in qwen3asr_fun
File "torch\utils\_contextlib.py", line 116, in decorate_context

return func(*args, **kwargs)

File "D:\win-pyvideotrans-v4.02-0616\_internal\qwen_asr\inference\qwen3_asr.py", line 345, in transcribe

raise ValueError(f"Batch size mismatch: audio={n}, context={len(ctxs)}")

ValueError: Batch size mismatch: audio=8, context=0
[Qwen-ASR(本地内置), Google(免费), Edge-TTS(免费)]
Traceback (most recent call last):
File "videotrans\task\only_one.py", line 47, in run
File "videotrans\task\trans_create.py", line 317, in recogn
File "videotrans\recognition\__init__.py", line 190, in run
File "videotrans\recognition\_base.py", line 94, in run
File "videotrans\recognition\_qwenasrlocal.py", line 45, in _exec
File "videotrans\configure\base.py", line 268, in _new_process
videotrans.configure.excepts.VideoTransError: Batch size mismatch: audio=8, context=0:Traceback (most recent call last):
File "videotrans\process\stt_fun.py", line 559, in qwen3asr_fun
File "torch\utils\_contextlib.py", line 116, in decorate_context

return func(*args, **kwargs)

File "D:\win-pyvideotrans-v4.02-0616\_internal\qwen_asr\inference\qwen3_asr.py", line 345, in transcribe

raise ValueError(f"Batch size mismatch: audio={n}, context={len(ctxs)}")

ValueError: Batch size mismatch: audio=8, context=0
TaskCfgVTT(uuid='d87b1dd66e', name='D:/win-pyvideotrans-v4.02-0616/myVideo/test.mp4', dirname='D:/win-pyvideotrans-v4.02-0616/myVideo', noextname='test', basename='test.mp4', ext='mp4', target_dir='D:/win-pyvideotrans-v4.02-0616/myVideo/test-mp4', cache_folder='D:/win-pyvideotrans-v4.02-0616/tmp/21348/d87b1dd66e', is_cuda=True, source_language='英语', source_language_code='en', source_sub='D:/win-pyvideotrans-v4.02-0616/myVideo/test-mp4/en.srt', source_wav='D:/win-pyvideotrans-v4.02-0616/tmp/21348/d87b1dd66e/en.wav', source_wav_output='D:/win-pyvideotrans-v4.02-0616/myVideo/test-mp4/en.m4a', target_language='简体中文', target_language_code='zh-cn', target_sub='D:/win-pyvideotrans-v4.02-0616/myVideo/test-mp4/zh-cn.srt', target_wav='D:/win-pyvideotrans-v4.02-0616/tmp/21348/d87b1dd66e/target.wav', target_wav_output='D:/win-pyvideotrans-v4.02-0616/myVideo/test-mp4/zh-cn.m4a', translate_type=0, tts_type=0, volume='+0%', pitch='+0Hz', voice_rate='+0%', voice_role='Yunyang(Male/CN)', voice_autorate=True, video_autorate=True, remove_silent_mid=False, align_sub_audio=True, detect_language='en', recogn_type=2, model_name='1.7B', shibie_audio=None, remove_noise=False, enable_diariz=False, nums_diariz=0, rephrase=0, fix_punc=0, subtitle_language=None, app_mode='biaozhun', subtitles='', targetdir_mp4='D:/win-pyvideotrans-v4.02-0616/myVideo/test-mp4/test.mp4', novoice_mp4='D:/win-pyvideotrans-v4.02-0616/tmp/21348/d87b1dd66e/novoice.mp4', is_separate=False, embed_bgm=True, instrument='D:/win-pyvideotrans-v4.02-0616/tmp/21348/d87b1dd66e/instrument.wav', vocal='D:/win-pyvideotrans-v4.02-0616/tmp/21348/d87b1dd66e/vocal.wav', clear_cache=True, background_music='', subtitle_type=0, only_out_mp4=False, recogn2pass=False, output_srt=0, copysrt_rawvideo=False, loop_backaudio=1, backaudio_volume=0.8)


=
system:Windows-10-10.0.26200-SP0
version:v4.02
frozen:True
language:zh
root_dir:D:/win-pyvideotrans-v4.02-0616

1 Replies

这是 Qwen-ASR 本地模型的一个底层推理报错,常见于模型加载异常或音频处理时上下文信息丢失。请尝试以下步骤:

  1. 删除模型缓存重新下载
    关闭软件后,删除 models/ 目录下的 models--Qwen--Qwen3-ASR-... 文件夹(或对应缓存),重启软件,让模型在第一次使用时重新下载。
  2. 更换语音识别渠道
    可临时换用 faster-whisper(本地) + large-v3 模型,或使用在线渠道(如豆包语音大模型极速版、阿里百炼 Qwen3-ASR)。
  3. 检查音频文件
    确保输入的音频/视频时长超过 3 秒,无静音段或过短片段。若视频较短,可尝试二次识别并调整 VAD 参数(高级选项 -> 语音识别参数 -> 最短语音持续毫秒 适当增大)。
  4. 确认 CUDA 环境稳定
    如果您开启了 CUDA 加速,请确认显卡空闲显存不低于 4GB(1.7B 模型约需 3-4GB),并已正确安装 cuDNN 9.11+。

若以上方法无效,请提供 logs/ 目录下最新日志文件(底部约 30 行),以便进一步分析。

Post Your Reply
Maintaining a free, open-source project is not easy. If this project is helpful to you, please consider making a small donation to help keep it maintained and updated. Donate: ko-fi.com/jianchang512

Related resource