Open ExpressGit opened 4 months ago
10 分钟的音频依然没有时间戳(模型:whisper-large-v3)
from funasr import AutoModel
model = AutoModel( model="iic/Whisper-large-v3", vad_model="iic/speech_fsmn_vad_zh-cn-16k-common-pytorch", vad_kwargs={"max_single_segment_time": 30000}, )
DecodingOptions = { "task": "transcribe", "language": None, "without_timestamps": False, }
res = model.generate( DecodingOptions=DecodingOptions, batch_size_s=0, input="data/ch_multi.wav", )
print(res)
pip
Please update funasr by installing the latest version from source.
10 分钟的音频依然没有时间戳(模型:whisper-large-v3)
❓ Questions and Help
from funasr import AutoModel
model = AutoModel( model="iic/Whisper-large-v3", vad_model="iic/speech_fsmn_vad_zh-cn-16k-common-pytorch", vad_kwargs={"max_single_segment_time": 30000}, )
DecodingOptions = { "task": "transcribe", "language": None, "without_timestamps": False, }
res = model.generate( DecodingOptions=DecodingOptions, batch_size_s=0, input="data/ch_multi.wav", )
print(res)
pip
How you installed funasr (pip, source): pip