Compare commits

...

2 commits

Author SHA1 Message Date
Hoang Dinh ccaea823b2
Merge 4a14707f06 into 6ddfdfee6a 2024-09-08 21:48:39 +09:00
Administrator Administrator 4a14707f06 Turn on Audio Sync for audio extraction process 2024-09-01 19:38:43 -07:00
2 changed files with 3 additions and 1 deletion

View file

@@ -143,7 +143,7 @@ def encode_audio_stream(path, ffmpeg_path, audio_stream_language=None):
logger.debug(f"Whisper will only use the {audio_stream_language} audio stream for {path}")
inp = inp[f'a:m:language:{audio_stream_language}']
-out, _ = inp.output("-", format="s16le", acodec="pcm_s16le", ac=1, ar=16000) \
+out, _ = inp.output("-", format="s16le", acodec="pcm_s16le", ac=1, ar=16000, af="aresample=async=1") \
.run(cmd=[ffmpeg_path, "-nostdin"], capture_stdout=True, capture_stderr=True)
except ffmpeg.Error as e:

View file

@@ -367,6 +367,8 @@ class VideoSpeechTransformer(TransformerMixin):
"1",
"-acodec",
"pcm_s16le",
+"-af",
+"aresample=async=1",
"-ar",
str(self.frame_rate),
"-",