when silences are detected, speaker correction is no longer applied

This commit is contained in:
Quentin Fuxa
2024-08-24 19:24:00 +02:00
parent 52a755a08c
commit 4ed62e181d

View File

@@ -119,16 +119,16 @@ def format_output(state, silence, current_time, diarization, debug):
if speaker != previous_speaker:
if next_punctuation_change(i, tokens):
if speaker == -2 or previous_speaker == -2: #silences can happen anytime
lines.append(new_line(token, speaker, last_end_diarized, debug_info = ""))
continue
elif next_punctuation_change(i, tokens):
# Corrects advance:
# Are you |SPLIT SPEAKER| okay? yeah, sure. Absolutely
# should become:
# Are you okay? |SPLIT SPEAKER| yeah, sure. Absolutely
append_token_to_last_line(lines, sep, token, debug_info, last_end_diarized)
continue
elif speaker == -2 or previous_speaker == -2: #silences can happen anytime
lines.append(new_line(token, speaker, last_end_diarized, debug_info = ""))
continue
else: #we create a new speaker, but that's no ideal. We are not sure about the split. We prefer to append to previous line
# lines.append(new_line(token, speaker, last_end_diarized, debug_info = ""))
pass