Update v2.txt

v2.txt (CHANGED)
@@ -3,11 +3,25 @@ import tempfile
 import os
 import requests
 import gradio as gr
+import random
 from openai import OpenAI
 
 # Available voices for audio generation
 VOICES = ["alloy", "ash", "ballad", "coral", "echo", "fable", "onyx", "nova", "sage", "shimmer", "verse"]
 
+# Example audio URLs
+EXAMPLE_AUDIO_URLS = [
+    "https://cdn.openai.com/API/docs/audio/alloy.wav",
+    "https://cdn.openai.com/API/docs/audio/ash.wav",
+    "https://cdn.openai.com/API/docs/audio/coral.wav",
+    "https://cdn.openai.com/API/docs/audio/echo.wav",
+    "https://cdn.openai.com/API/docs/audio/fable.wav",
+    "https://cdn.openai.com/API/docs/audio/onyx.wav",
+    "https://cdn.openai.com/API/docs/audio/nova.wav",
+    "https://cdn.openai.com/API/docs/audio/sage.wav",
+    "https://cdn.openai.com/API/docs/audio/shimmer.wav"
+]
+
 def process_text_input(api_key, text_prompt, selected_voice):
     """Generate audio response from text input"""
     try:
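The example-audio button added later in this patch depends on these CDN files being reachable at run time. A quick hedged check using the requests import the app already has (the two-URL subset and the 10-second timeout are illustrative choices, not from the patch; if the CDN rejects HEAD, a requests.get with stream=True works the same way):

    import requests

    # Subset of EXAMPLE_AUDIO_URLS from the hunk above; extend with the full list as needed.
    EXAMPLE_AUDIO_URLS = [
        "https://cdn.openai.com/API/docs/audio/alloy.wav",
        "https://cdn.openai.com/API/docs/audio/ash.wav",
    ]

    for url in EXAMPLE_AUDIO_URLS:
        # HEAD fetches only headers, so the check stays cheap; 200 means the sample is up.
        resp = requests.head(url, timeout=10)
        print(url, "->", resp.status_code)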
@@ -115,9 +129,14 @@ def transcribe_audio(api_key, audio_path):
         return f"Transcription error: {str(e)}"
 
 def download_example_audio():
-    """Download
+    """Download a random example audio file for testing"""
     try:
-
+        # Randomly select one of the example audio URLs
+        url = random.choice(EXAMPLE_AUDIO_URLS)
+
+        # Get the voice name from the URL for feedback
+        voice_name = url.split('/')[-1].split('.')[0]
+
         response = requests.get(url)
         response.raise_for_status()
 
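The voice name is recovered as the URL's file stem via two split calls. An equivalent formulation with pathlib, shown only as an illustrative alternative, not part of the patch:

    from pathlib import PurePosixPath

    url = "https://cdn.openai.com/API/docs/audio/alloy.wav"
    # .stem drops the directory part and the extension in one step
    voice_name = PurePosixPath(url).stem  # "alloy", same as url.split('/')[-1].split('.')[0]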
@@ -126,14 +145,14 @@ def download_example_audio():
         with open(temp_path, "wb") as f:
             f.write(response.content)
 
-        return temp_path
+        return temp_path, f"Loaded example voice: {voice_name}"
     except Exception as e:
-        return None
+        return None, f"Error loading example: {str(e)}"
 
 def use_example_audio():
-    """Load example audio for the interface"""
-    audio_path = download_example_audio()
-    return audio_path
+    """Load random example audio for the interface"""
+    audio_path, message = download_example_audio()
+    return audio_path, message
 
 # Create Gradio Interface
 with gr.Blocks(title="OpenAI Audio Chat App") as app:
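The two hunks above leave a gap of unchanged context (old lines 124-125) where the temporary file path is created. For reference, a sketch of how the patched download_example_audio reads end to end, assuming the hidden context allocates the path with tempfile.NamedTemporaryFile (import tempfile appears in the first hunk's context; the subset list stands in for the full EXAMPLE_AUDIO_URLS):

    import random
    import tempfile
    import requests

    # EXAMPLE_AUDIO_URLS as defined in the first hunk (subset here for brevity)
    EXAMPLE_AUDIO_URLS = ["https://cdn.openai.com/API/docs/audio/alloy.wav"]

    def download_example_audio():
        """Download a random example audio file for testing"""
        try:
            # Randomly select one of the example audio URLs
            url = random.choice(EXAMPLE_AUDIO_URLS)

            # Get the voice name from the URL for feedback
            voice_name = url.split('/')[-1].split('.')[0]

            response = requests.get(url)
            response.raise_for_status()

            # Assumed unchanged context: allocate a temp .wav path for the download
            with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as tmp:
                temp_path = tmp.name

            with open(temp_path, "wb") as f:
                f.write(response.content)

            return temp_path, f"Loaded example voice: {voice_name}"
        except Exception as e:
            return None, f"Error loading example: {str(e)}"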
@@ -163,7 +182,7 @@ with gr.Blocks(title="OpenAI Audio Chat App") as app:
             text_submit = gr.Button("Generate Response")
 
         with gr.Column():
-            text_output = gr.Textbox(label="AI Response (
+            text_output = gr.Textbox(label="AI Response (Checks Error)", lines=5)
             audio_output = gr.Audio(label="AI Response (Audio)")
             transcribed_output = gr.Textbox(label="Transcription of Audio Response", lines=3)
 
@@ -193,7 +212,8 @@ with gr.Blocks(title="OpenAI Audio Chat App") as app:
                 type="filepath",
                 sources=["microphone", "upload"]
             )
-            example_btn = gr.Button("Use Example Audio")
+            example_btn = gr.Button("Use Random Example Audio")
+            example_message = gr.Textbox(label="Example Status", interactive=False)
 
             accompanying_text = gr.Textbox(
                 label="Accompanying Text (Optional)",
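The new status box is declared with interactive=False so it renders read-only: the user cannot type into it, and only handler outputs (the click wiring later in this diff) update it. A minimal standalone illustration, not part of the patch:

    import gradio as gr

    with gr.Blocks() as demo:
        # Read-only display component; written to only by event handlers
        example_message = gr.Textbox(label="Example Status", interactive=False)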
@@ -208,7 +228,7 @@ with gr.Blocks(title="OpenAI Audio Chat App") as app:
             audio_submit = gr.Button("Process Audio & Generate Response")
 
         with gr.Column():
-            audio_text_output = gr.Textbox(label="AI Response (
+            audio_text_output = gr.Textbox(label="AI Response (Checks Error)", lines=5)
             audio_audio_output = gr.Audio(label="AI Response (Audio)")
             audio_transcribed_output = gr.Textbox(label="Transcription of Audio Response", lines=3)
             input_transcription = gr.Textbox(label="Transcription of Input Audio", lines=3)
@@ -239,7 +259,7 @@ with gr.Blocks(title="OpenAI Audio Chat App") as app:
         example_btn.click(
             fn=use_example_audio,
             inputs=[],
-            outputs=[audio_input]
+            outputs=[audio_input, example_message]
         )
 
     with gr.Tab("Voice Samples"):
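Because use_example_audio now returns a two-tuple, the outputs list gains a second component: Gradio maps the returned tuple onto outputs positionally, and a None in the first slot leaves the audio input empty on failure while the status box still shows the error. A self-contained sketch of this wiring pattern (the handler body is a stand-in; component names are reused from the patch):

    import gradio as gr

    def use_example_audio():
        # Stand-in for the patched handler: (filepath or None, status message)
        return None, "Error loading example: network unreachable"

    with gr.Blocks() as demo:
        audio_input = gr.Audio(label="Audio Input", type="filepath")
        example_btn = gr.Button("Use Random Example Audio")
        example_message = gr.Textbox(label="Example Status", interactive=False)

        # Tuple maps positionally: first value -> audio_input, second -> example_message
        example_btn.click(fn=use_example_audio, inputs=[], outputs=[audio_input, example_message])

    if __name__ == "__main__":
        demo.launch()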
@@ -302,6 +322,7 @@ with gr.Blocks(title="OpenAI Audio Chat App") as app:
     - Audio inputs should be in WAV format
     - Available voices: alloy, ash, ballad, coral, echo, fable, onyx, nova, sage, shimmer, and verse
     - Each audio response is automatically transcribed for verification
+    - The "Use Random Example Audio" button will load a random sample from OpenAI's demo voices
     """)
 
 if __name__ == "__main__":
|