Update app.py
Browse files
app.py
CHANGED
@@ -72,16 +72,17 @@ def transcribe_audio(file_path):
|
|
72 |
return "Reference not found.", "", "", "", "", "", ""
|
73 |
|
74 |
model_ids = [
|
75 |
-
"openai/whisper-tiny",
|
76 |
-
"openai/whisper-tiny.en",
|
77 |
-
"openai/whisper-base",
|
78 |
-
"openai/whisper-base.en",
|
79 |
-
"openai/whisper-medium",
|
80 |
-
"openai/whisper-medium.en",
|
81 |
-
"distil-whisper/distil-large-v3.5",
|
82 |
-
"facebook/wav2vec2-base-960h",
|
83 |
-
"facebook/wav2vec2-large-960h",
|
84 |
-
"facebook/hubert-large-ls960-ft",
|
|
|
85 |
]
|
86 |
|
87 |
outputs = {}
|
@@ -144,6 +145,7 @@ with gr.Blocks() as demo:
|
|
144 |
distil_html = gr.HTML(label="Distil-Whisper Large")
|
145 |
wav2vec_base_html = gr.HTML(label="Wav2Vec2 Base")
|
146 |
wav2vec_large_html = gr.HTML(label="Wav2Vec2 Large")
|
|
|
147 |
hubert_html = gr.HTML(label="HuBERT Large")
|
148 |
|
149 |
transcribe_btn.click(
|
@@ -160,6 +162,7 @@ with gr.Blocks() as demo:
|
|
160 |
distil_html,
|
161 |
wav2vec_base_html,
|
162 |
wav2vec_large_html,
|
|
|
163 |
hubert_html,
|
164 |
],
|
165 |
)
|
|
|
72 |
return "Reference not found.", "", "", "", "", "", ""
|
73 |
|
74 |
model_ids = [
|
75 |
+
"openai/whisper-tiny", # Smallest, multilingual
|
76 |
+
"openai/whisper-tiny.en", # Tiny, English-only
|
77 |
+
"openai/whisper-base", # Balanced, multilingual
|
78 |
+
"openai/whisper-base.en", # Base, English-only
|
79 |
+
"openai/whisper-medium", # Medium, multilingual
|
80 |
+
"openai/whisper-medium.en", # Medium, English-only
|
81 |
+
"distil-whisper/distil-large-v3.5", # Distilled from Whisper large, Faster & More accurate
|
82 |
+
"facebook/wav2vec2-base-960h", # Base model trained on 960h LibriSpeech (monolingual, English)
|
83 |
+
"facebook/wav2vec2-large-960h", # Larger model, better performance (monolingual, English)
|
84 |
+
"facebook/wav2vec2-large-960h-lv60-self", # Fine-tuned on 60k LibriLight hours
|
85 |
+
"facebook/hubert-large-ls960-ft", # Fine-tuned on LibriSpeech
|
86 |
]
|
87 |
|
88 |
outputs = {}
|
|
|
145 |
distil_html = gr.HTML(label="Distil-Whisper Large")
|
146 |
wav2vec_base_html = gr.HTML(label="Wav2Vec2 Base")
|
147 |
wav2vec_large_html = gr.HTML(label="Wav2Vec2 Large")
|
148 |
+
wav2vec_lv60_html = gr.HTML(label="Wav2Vec2 Large + LibriLight")
|
149 |
hubert_html = gr.HTML(label="HuBERT Large")
|
150 |
|
151 |
transcribe_btn.click(
|
|
|
162 |
distil_html,
|
163 |
wav2vec_base_html,
|
164 |
wav2vec_large_html,
|
165 |
+
wav2vec_lv60_html,
|
166 |
hubert_html,
|
167 |
],
|
168 |
)
|