You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
ERROR:root:An error occurred: choose a window size 400 that is [2, 160] | 0/24 [00:00<?, ?it/s]
Traceback (most recent call last):
File "/UD-AI-TextToSpeech/text_to_speech/server_gpu.py", line 303, in audio2text
text = sense_voice_model(params)
File "/UD-AI-TextToSpeech/text_to_speech/audio_to_text/sense_voice_model.py", line 20, in call
res = self.sense_voice_model.generate(
File "/usr/local/lib/python3.10/dist-packages/funasr/auto/auto_model.py", line 263, in generate
return self.inference_with_vad(input, input_len=input_len, **cfg)
File "/usr/local/lib/python3.10/dist-packages/funasr/auto/auto_model.py", line 417, in inference_with_vad
results = self.inference(
File "/usr/local/lib/python3.10/dist-packages/funasr/auto/auto_model.py", line 302, in inference
res = model.inference(**batch, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/funasr/models/sense_voice/model.py", line 832, in inference
speech, speech_lengths = extract_fbank(
File "/usr/local/lib/python3.10/dist-packages/funasr/utils/load_utils.py", line 173, in extract_fbank
data, data_len = frontend(data, data_len, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1532, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1541, in _call_impl
return forward_call(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/funasr/frontends/wav_frontend.py", line 134, in forward
mat = kaldi.fbank(
File "/usr/local/lib/python3.10/dist-packages/torchaudio/compliance/kaldi.py", line 591, in fbank
waveform, window_shift, window_size, padded_window_size = _get_waveform_and_window_properties(
File "/usr/local/lib/python3.10/dist-packages/torchaudio/compliance/kaldi.py", line 142, in _get_waveform_and_window_properties
assert 2 <= window_size <= len(waveform), "choose a window size {} that is [2, {}]".format(
AssertionError: choose a window size 400 that is [2, 160]
0%| | 0/24 [00:00<?, ?it/s]
0%| | 0/1 [00:06<?, ?it/s]
INFO:werkzeug:172.31.16.5 - - [23/Oct/2024 02:15:55] "POST /audio2text HTTP/1.1" 500 -
The text was updated successfully, but these errors were encountered:
同一个视频，在 Windows 上是好的，在 Ubuntu 上报错。
ERROR:root:An error occurred: choose a window size 400 that is [2, 160] | 0/24 [00:00<?, ?it/s]
Traceback (most recent call last):
File "/UD-AI-TextToSpeech/text_to_speech/server_gpu.py", line 303, in audio2text
text = sense_voice_model(params)
File "/UD-AI-TextToSpeech/text_to_speech/audio_to_text/sense_voice_model.py", line 20, in call
res = self.sense_voice_model.generate(
File "/usr/local/lib/python3.10/dist-packages/funasr/auto/auto_model.py", line 263, in generate
return self.inference_with_vad(input, input_len=input_len, **cfg)
File "/usr/local/lib/python3.10/dist-packages/funasr/auto/auto_model.py", line 417, in inference_with_vad
results = self.inference(
File "/usr/local/lib/python3.10/dist-packages/funasr/auto/auto_model.py", line 302, in inference
res = model.inference(**batch, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/funasr/models/sense_voice/model.py", line 832, in inference
speech, speech_lengths = extract_fbank(
File "/usr/local/lib/python3.10/dist-packages/funasr/utils/load_utils.py", line 173, in extract_fbank
data, data_len = frontend(data, data_len, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1532, in _wrapped_call_impl
return self._call_impl(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/module.py", line 1541, in _call_impl
return forward_call(*args, **kwargs)
File "/usr/local/lib/python3.10/dist-packages/funasr/frontends/wav_frontend.py", line 134, in forward
mat = kaldi.fbank(
File "/usr/local/lib/python3.10/dist-packages/torchaudio/compliance/kaldi.py", line 591, in fbank
waveform, window_shift, window_size, padded_window_size = _get_waveform_and_window_properties(
File "/usr/local/lib/python3.10/dist-packages/torchaudio/compliance/kaldi.py", line 142, in _get_waveform_and_window_properties
assert 2 <= window_size <= len(waveform), "choose a window size {} that is [2, {}]".format(
AssertionError: choose a window size 400 that is [2, 160]
0%| | 0/24 [00:00<?, ?it/s]
0%| | 0/1 [00:06<?, ?it/s]
INFO:werkzeug:172.31.16.5 - - [23/Oct/2024 02:15:55] "POST /audio2text HTTP/1.1" 500 -
The text was updated successfully, but these errors were encountered: