Committed by GitHub
Avoid adding tail padding for VAD in generate-subtitles.py (#1674)
正在显示 1 个修改的文件，包含 3 行增加和 9 行删除
| @@ -516,16 +516,13 @@ def main(): | @@ -516,16 +516,13 @@ def main(): | ||
| 516 | 516 | ||
| 517 | is_eof = False | 517 | is_eof = False |
| 518 | # TODO(fangjun): Support multithreads | 518 | # TODO(fangjun): Support multithreads |
| 519 | - while True: | 519 | + while not is_eof: |
| 520 | # *2 because int16_t has two bytes | 520 | # *2 because int16_t has two bytes |
| 521 | data = process.stdout.read(frames_per_read * 2) | 521 | data = process.stdout.read(frames_per_read * 2) |
| 522 | if not data: | 522 | if not data: |
| 523 | - if is_eof: | ||
| 524 | - break | 523 | + vad.flush() |
| 525 | is_eof = True | 524 | is_eof = True |
| 526 | - # pad 1 second at the end of the file for the VAD | ||
| 527 | - data = np.zeros(1 * args.sample_rate, dtype=np.int16) | ||
| 528 | - | 525 | + else: |
| 529 | samples = np.frombuffer(data, dtype=np.int16) | 526 | samples = np.frombuffer(data, dtype=np.int16) |
| 530 | samples = samples.astype(np.float32) / 32768 | 527 | samples = samples.astype(np.float32) / 32768 |
| 531 | 528 | ||
| @@ -536,9 +533,6 @@ def main(): | @@ -536,9 +533,6 @@ def main(): | ||
| 536 | vad.accept_waveform(buffer[:window_size]) | 533 | vad.accept_waveform(buffer[:window_size]) |
| 537 | buffer = buffer[window_size:] | 534 | buffer = buffer[window_size:] |
| 538 | 535 | ||
| 539 | - if is_eof: | ||
| 540 | - vad.flush() | ||
| 541 | - | ||
| 542 | streams = [] | 536 | streams = [] |
| 543 | segments = [] | 537 | segments = [] |
| 544 | while not vad.empty(): | 538 | while not vad.empty(): |
-
请 注册 或 登录 后发表评论