Compare commits

...

3 commits

Author SHA1 Message Date
Hoang Dinh 4febc61deb
Merge 7674ecdb2a into cc7a8000e7 2024-09-18 06:50:43 +00:00
Hoang Dinh 7674ecdb2a
Update speech_transformers.py 2024-09-17 23:50:41 -07:00
Administrator Administrator 4a14707f06 Turn on Audio Sync for audio extraction process 2024-09-01 19:38:43 -07:00

View file

@@ -143,7 +143,7 @@ def encode_audio_stream(path, ffmpeg_path, audio_stream_language=None):
logger.debug(f"Whisper will only use the {audio_stream_language} audio stream for {path}")
inp = inp[f'a:m:language:{audio_stream_language}']
-out, _ = inp.output("-", format="s16le", acodec="pcm_s16le", ac=1, ar=16000) \
+out, _ = inp.output("-", format="s16le", acodec="pcm_s16le", ac=1, ar=16000, af="aresample=async=1") \
.run(cmd=[ffmpeg_path, "-nostdin"], capture_stdout=True, capture_stderr=True)
except ffmpeg.Error as e: