Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -228,7 +228,7 @@ def transcribe_video_with_speakers(video_path):
|
|
228 |
"start": segment["start"],
|
229 |
"end": segment["end"],
|
230 |
"text": segment["text"],
|
231 |
-
"speaker": segment
|
232 |
}
|
233 |
for segment in result["segments"]
|
234 |
]
|
@@ -588,7 +588,7 @@ def process_entry(entry, i, tts_model, video_width, video_height, process_mode,
|
|
588 |
desired_duration = entry["end"] - entry["start"]
|
589 |
desired_speed = entry['speed'] #calibrated_speed(entry['translated'], desired_duration)
|
590 |
|
591 |
-
speaker = entry.get("speaker", "
|
592 |
speaker_wav_path = f"speaker_{speaker}_sample.wav"
|
593 |
|
594 |
if process_mode > 2 and speaker_wav_path and os.path.exists(speaker_wav_path) and target_language in tts_model.synthesizer.tts_model.language_manager.name_to_id.keys():
|
|
|
228 |
"start": segment["start"],
|
229 |
"end": segment["end"],
|
230 |
"text": segment["text"],
|
231 |
+
"speaker": segment.get("speaker", "SPEAKER_00")
|
232 |
}
|
233 |
for segment in result["segments"]
|
234 |
]
|
|
|
588 |
desired_duration = entry["end"] - entry["start"]
|
589 |
desired_speed = entry['speed'] #calibrated_speed(entry['translated'], desired_duration)
|
590 |
|
591 |
+
speaker = entry.get("speaker", "SPEAKER_00")
|
592 |
speaker_wav_path = f"speaker_{speaker}_sample.wav"
|
593 |
|
594 |
if process_mode > 2 and speaker_wav_path and os.path.exists(speaker_wav_path) and target_language in tts_model.synthesizer.tts_model.language_manager.name_to_id.keys():
|