Spaces:

Tamiloneto8
/

Oneto8-test

Sleeping

App Files Files Community

Tamiloneto8 commited on Jul 15

Commit

888cc03

verified ·

1 Parent(s): ed008e7

Update app.py

Browse files

Files changed (1) hide show

app.py +119 -68

app.py CHANGED Viewed

@@ -11,7 +11,7 @@ logger = logging.getLogger(__name__)
 # It's recommended to set the HUGGINGFACE_TOKEN as an environment variable
 token = os.getenv("HUGGINGFACE_TOKEN")
-def create_dubindic_interface():
     """
     Creates and configures the Gradio interface for the DubIndic application.
     """
@@ -23,22 +23,24 @@ def create_dubindic_interface():
     except Exception as e:
         logger.error("Error connecting to the private space: %s", e, exc_info=True)
         # Create a fallback interface to show the connection error
-        with gr.Blocks(theme=gr_themes.Soft()) as demo:
-            gr.Markdown("# 🚨 DubIndic - Connection Error")
-            gr.Markdown(f"**Error Details:** {str(e)}")
-            gr.Markdown("Please check your Hugging Face token and ensure the Space 'Tamiloneto8/Test1' is running.")
         return demo
     # Define wrapper functions to call the API endpoints
     def start_processing(audio_file, target_language):
         if not audio_file or not target_language:
-            gr.Warning("Please provide both an audio file and select a target language.")
             return (
-                "⚠️ Waiting for input...", None, "", "", None, "",
                 gr.update(visible=False), gr.update(visible=False)
             )
         try:
-            gr.Info("Starting processing... This may take a moment.")
             logger.info("Calling /process_audio_pipeline_step1 with file: %s", audio_file)
             result = client.predict(
                 audio_file=handle_file(audio_file),
@@ -46,50 +48,54 @@ def create_dubindic_interface():
                 api_name="/process_audio_pipeline_step1"
             )
             logger.info("Received result from step 1: %s", result)
-            gr.Info("Processing started! The first chunk is ready for editing.")
             return (
-                f"✅ {result[0]}", result[2], result[3], result[4], result[5], result[6],
-                gr.update(visible=True), gr.update(visible=True)
             )
         except Exception as e:
             logger.error("Error in start_processing: %s", e, exc_info=True)
-            gr.Error(f"Error starting process: {e}")
             return (
-                f"❌ Error: {str(e)}", None, "", "", None, "",
                 gr.update(visible=False), gr.update(visible=False)
             )
     def navigate_chunk(transcription, translation, direction):
         api_to_call = "/lambda" if direction == "prev" else "/lambda_1"
         try:
             logger.info("Calling %s to navigate.", api_to_call)
-            result = client.predict(t=transcription, tr=translation, api_name=api_to_call)
             logger.info("Received result from navigation: %s", result)
             return result[1], result[2], result[3], result[4], result[5]
         except Exception as e:
             logger.error("Error navigating chunks: %s", e, exc_info=True)
-            gr.Warning(f"Navigation error: {e}")
-            # Return gr.update() to avoid changing the component values on error
-            return gr.update(), gr.update(), gr.update(), gr.update(), gr.update()
     def generate_dubbed_chunk(transcription, translation):
         if not transcription and not translation:
-            gr.Warning("Cannot generate audio from empty text fields.")
             return None
         try:
             logger.info("Calling /generate_dubbed_chunk.")
-            gr.Info("Generating dubbed audio for the current chunk...")
             dubbed_path = client.predict(
                 transcription=transcription,
                 translation=translation,
                 api_name="/generate_dubbed_chunk"
             )
             logger.info("Received dubbed chunk: %s", dubbed_path)
-            gr.Info("Dubbed chunk generated successfully!")
             return dubbed_path
         except Exception as e:
             logger.error("Error generating dubbed chunk: %s", e, exc_info=True)
-            gr.Error(f"Error generating audio: {e}")
             return None
     def finalize_current_chunk():
@@ -97,69 +103,113 @@ def create_dubindic_interface():
             logger.info("Calling /finalize_current_chunk.")
             progress = client.predict(api_name="/finalize_current_chunk")
             logger.info("Received finalization progress: %s", progress)
-            gr.Info("Chunk finalized!")
-            return f"✅ {progress}"
         except Exception as e:
             logger.error("Error finalizing chunk: %s", e, exc_info=True)
-            gr.Error(f"Error finalizing chunk: {e}")
-            return f"❌ Error finalizing: {str(e)}"
     def merge_all_chunks():
         try:
             logger.info("Calling /merge_audio_files.")
-            gr.Info("Merging all finalized chunks. This may take a moment...")
             final_status, final_audio = client.predict(api_name="/merge_audio_files")
             logger.info("Received final merged audio.")
-            gr.Info("Merge complete! Final audio is ready.")
-            return f"🎉 {final_status}", final_audio
         except Exception as e:
             logger.error("Error merging audio files: %s", e, exc_info=True)
-            gr.Error(f"Merge error: {e}")
-            return f"❌ Merge error: {str(e)}", None
-    # Create custom theme
-    custom_theme = gr_themes.Soft(primary_hue="orange", secondary_hue="red", neutral_hue="slate")
-    # Define the Gradio interface
-    with gr.Blocks(theme=custom_theme, title="DubIndic - AI Audio Dubbing") as demo:
-        gr.Markdown('<div style="text-align: center; font-size: 2.5rem; font-weight: 800; margin-bottom: 1rem;">🎬 DubIndic - AI Audio Dubbing Pipeline</div>')
-        gr.Markdown('<div style="text-align: center; margin-bottom: 2rem; font-size: 1.1rem; color: #666;">Transform your audio into another Indian language with full editing control</div>')
-        # Step 1
-        with gr.Group():
-            gr.Markdown("### 📤 Step 1: Upload & Configure")
-            with gr.Row():
                 audio_input = gr.Audio(sources=["upload"], type="filepath", label="🎵 Upload Audio File")
                 lang_dropdown = gr.Dropdown(
                     choices=["Assamese", "Bengali", "Gujarati", "Hindi", "Kannada", "Malayalam", "Marathi", "Odia", "Punjabi", "Tamil", "Telugu"],
                     label="🌐 Target Language"
                 )
-            process_btn = gr.Button("🎯 Start Processing", variant="primary")
-            step1_output = gr.Textbox(label="📊 Processing Status", interactive=False)
-        # Step 2
-        with gr.Group(visible=False) as edit_section:
-            gr.Markdown("### ✏️ Step 2: Edit, Generate & Finalize")
             with gr.Row():
                 prev_btn = gr.Button("◀️ Previous")
                 next_btn = gr.Button("Next ▶️")
             with gr.Row():
-                original_audio = gr.Audio(label="🎵 Original Chunk Audio", type="filepath", interactive=False)
-                dubbed_audio = gr.Audio(label="🎤 Dubbed Chunk Audio", type="filepath", interactive=False)
-            transcription_text = gr.Textbox(label="📝 Transcription (edit if needed)", lines=3, interactive=True)
-            translation_text = gr.Textbox(label="🔄 Translation (edit if needed)", lines=3, interactive=True)
-            with gr.Row():
-                generate_btn = gr.Button("🔊 Generate Dubbed Chunk", variant="secondary")
                 finalize_btn = gr.Button("✔️ Finalize Chunk", variant="secondary")
-            progress_text = gr.Textbox(label="📈 Progress", interactive=False)
-        # Step 3
-        with gr.Group(visible=False) as merge_section:
             gr.Markdown("### 🏁 Step 3: Merge Final Audio")
             merge_btn = gr.Button("🚀 Merge All Finalized Chunks", variant="primary")
-            with gr.Row():
-                final_output = gr.Textbox(label="🎉 Final Results", interactive=False)
-                output_audio = gr.Audio(label="🔊 Final Dubbed Audio", type="filepath", interactive=False)
         # Connect functions to UI components
         process_btn.click(
@@ -167,41 +217,42 @@ def create_dubindic_interface():
             inputs=[audio_input, lang_dropdown],
             outputs=[step1_output, original_audio, transcription_text, translation_text, dubbed_audio, progress_text, edit_section, merge_section]
         )
         prev_btn.click(
             fn=lambda t, tr: navigate_chunk(t, tr, "prev"),
             inputs=[transcription_text, translation_text],
             outputs=[original_audio, transcription_text, translation_text, dubbed_audio, progress_text]
         )
         next_btn.click(
             fn=lambda t, tr: navigate_chunk(t, tr, "next"),
             inputs=[transcription_text, translation_text],
             outputs=[original_audio, transcription_text, translation_text, dubbed_audio, progress_text]
         )
         generate_btn.click(
             fn=generate_dubbed_chunk,
             inputs=[transcription_text, translation_text],
             outputs=[dubbed_audio]
         )
         finalize_btn.click(
             fn=finalize_current_chunk,
             inputs=[],
             outputs=[progress_text]
         )
         merge_btn.click(
             fn=merge_all_chunks,
             inputs=[],
             outputs=[final_output, output_audio]
         )
     return demo
 if __name__ == "__main__":
-    dubindic_interface = create_dubindic_interface()
-    if dubindic_interface:
-        dubindic_interface.launch(
-            show_error=True,
-            share=False,
-            server_name="0.0.0.0",
-            server_port=7860
-        )
     else:
         logger.error("Failed to create the Gradio interface.")

 # It's recommended to set the HUGGINGFACE_TOKEN as an environment variable
 token = os.getenv("HUGGINGFACE_TOKEN")
+def create_DubIndic_interface():
     """
     Creates and configures the Gradio interface for the DubIndic application.
     """
     except Exception as e:
         logger.error("Error connecting to the private space: %s", e, exc_info=True)
         # Create a fallback interface to show the connection error
+        with gr.Blocks() as demo:
+            gr.Markdown("# 🎬 DubIndic - Connection Error")
+            gr.Textbox(
+                value=f"Failed to connect to the Hugging Face Space. Please ensure the Space is running and the token is correct. Error: {e}",
+                label="Error",
+                interactive=False
+            )
         return demo
     # Define wrapper functions to call the API endpoints
     def start_processing(audio_file, target_language):
         if not audio_file or not target_language:
             return (
+                "Please provide both an audio file and a target language.",
+                None, "", "", None, "",
                 gr.update(visible=False), gr.update(visible=False)
             )
         try:
             logger.info("Calling /process_audio_pipeline_step1 with file: %s", audio_file)
             result = client.predict(
                 audio_file=handle_file(audio_file),
                 api_name="/process_audio_pipeline_step1"
             )
             logger.info("Received result from step 1: %s", result)
+            # API returns a 7-element tuple, we map it to our UI outputs
+            # [status, internal_val, orig_audio, trans, transl, dubbed_audio, progress]
             return (
+                result[0], result[2], result[3], result[4], result[5], result[6],
+                gr.update(visible=True), gr.update(visible=True) # Make edit and merge sections visible
             )
         except Exception as e:
             logger.error("Error in start_processing: %s", e, exc_info=True)
             return (
+                f"Error starting the process: {e}",
+                None, "", "", None, "",
                 gr.update(visible=False), gr.update(visible=False)
             )
     def navigate_chunk(transcription, translation, direction):
+        # The API uses different endpoints for next/previous navigation
+        # We assume /lambda is for previous and /lambda_1 is for next
         api_to_call = "/lambda" if direction == "prev" else "/lambda_1"
         try:
             logger.info("Calling %s to navigate.", api_to_call)
+            result = client.predict(
+                t=transcription,
+                tr=translation,
+                api_name=api_to_call
+            )
             logger.info("Received result from navigation: %s", result)
+            # API returns a 6-element tuple
+            # [internal_val, orig_audio, trans, transl, dubbed_audio, progress]
             return result[1], result[2], result[3], result[4], result[5]
         except Exception as e:
             logger.error("Error navigating chunks: %s", e, exc_info=True)
+            return None, f"Error navigating chunks: {e}", "", None, ""
     def generate_dubbed_chunk(transcription, translation):
         if not transcription and not translation:
             return None
         try:
             logger.info("Calling /generate_dubbed_chunk.")
             dubbed_path = client.predict(
                 transcription=transcription,
                 translation=translation,
                 api_name="/generate_dubbed_chunk"
             )
             logger.info("Received dubbed chunk: %s", dubbed_path)
             return dubbed_path
         except Exception as e:
             logger.error("Error generating dubbed chunk: %s", e, exc_info=True)
             return None
     def finalize_current_chunk():
             logger.info("Calling /finalize_current_chunk.")
             progress = client.predict(api_name="/finalize_current_chunk")
             logger.info("Received finalization progress: %s", progress)
+            return progress
         except Exception as e:
             logger.error("Error finalizing chunk: %s", e, exc_info=True)
+            return f"Error finalizing chunk: {e}"
     def merge_all_chunks():
         try:
             logger.info("Calling /merge_audio_files.")
             final_status, final_audio = client.predict(api_name="/merge_audio_files")
             logger.info("Received final merged audio.")
+            return final_status, final_audio
         except Exception as e:
             logger.error("Error merging audio files: %s", e, exc_info=True)
+            return f"Error merging audio: {e}", None
+    # Create custom theme with orange-red gradient colors
+    custom_theme = gr_themes.Soft(
+        primary_hue="orange",
+        secondary_hue="red",
+        neutral_hue="gray"
+    ).set(
+        button_primary_background_fill="linear-gradient(45deg, #f97316, #ef4444)",
+        button_primary_background_fill_hover="linear-gradient(45deg, #ea580c, #dc2626)",
+        button_primary_text_color="white",
+        block_background_fill="rgba(255, 255, 255, 0.05)",
+        block_border_color="rgba(249, 115, 22, 0.2)",
+        input_background_fill="rgba(255, 255, 255, 0.9)",
+        input_border_color="rgba(249, 115, 22, 0.3)",
+        input_border_color_focus="rgba(239, 68, 68, 0.6)"
+    )
+    # Define the Gradio Interface using Blocks for a custom layout
+    with gr.Blocks(theme=custom_theme, title="DubIndic - AI Audio Dubbing", css="""
+        .gradio-container {
+            background: linear-gradient(135deg, rgba(249, 115, 22, 0.1), rgba(239, 68, 68, 0.1));
+        }
+        .gr-button[variant="primary"] {
+            background: linear-gradient(45deg, #f97316, #ef4444) !important;
+            border: none !important;
+            color: white !important;
+            font-weight: bold !important;
+        }
+        .gr-button[variant="primary"]:hover {
+            background: linear-gradient(45deg, #ea580c, #dc2626) !important;
+            transform: translateY(-1px);
+            box-shadow: 0 4px 8px rgba(239, 68, 68, 0.3);
+        }
+        .gr-button[variant="secondary"] {
+            background: linear-gradient(45deg, rgba(249, 115, 22, 0.1), rgba(239, 68, 68, 0.1)) !important;
+            border: 2px solid #f97316 !important;
+            color: #f97316 !important;
+            font-weight: bold !important;
+        }
+        .gr-button[variant="secondary"]:hover {
+            background: linear-gradient(45deg, #f97316, #ef4444) !important;
+            color: white !important;
+        }
+        h1 {
+            background: linear-gradient(45deg, #f97316, #ef4444);
+            -webkit-background-clip: text;
+            -webkit-text-fill-color: transparent;
+            background-clip: text;
+            font-weight: bold;
+        }
+        .gr-textbox {
+            border: 2px solid rgba(249, 115, 22, 0.3) !important;
+        }
+        .gr-textbox:focus {
+            border-color: #ef4444 !important;
+            box-shadow: 0 0 0 3px rgba(239, 68, 68, 0.1) !important;
+        }
+    """) as demo:
+        gr.Markdown("# 🎬 DubIndic - AI Audio Dubbing Pipeline")
+        gr.Markdown("Transform your audio into another Indian language with full editing control.")
+        with gr.Row():
+            with gr.Column(scale=1):
+                gr.Markdown("### 📤 Step 1: Upload & Configure")
                 audio_input = gr.Audio(sources=["upload"], type="filepath", label="🎵 Upload Audio File")
                 lang_dropdown = gr.Dropdown(
                     choices=["Assamese", "Bengali", "Gujarati", "Hindi", "Kannada", "Malayalam", "Marathi", "Odia", "Punjabi", "Tamil", "Telugu"],
                     label="🌐 Target Language"
                 )
+                process_btn = gr.Button("🎯 Start Processing", variant="primary")
+        step1_output = gr.Textbox(label="📊 Processing Status", interactive=False)
+        with gr.Column(visible=False) as edit_section:
+            gr.Markdown("### ✏️ Step 2: Edit, Generate & Finalize Chunks")
             with gr.Row():
                 prev_btn = gr.Button("◀️ Previous")
                 next_btn = gr.Button("Next ▶️")
+            original_audio = gr.Audio(label="Original Chunk Audio", type="filepath", interactive=False)
+            transcription_text = gr.Textbox(label="Transcription (edit if needed)", lines=2, interactive=True)
+            translation_text = gr.Textbox(label="Translation (edit if needed)", lines=2, interactive=True)
             with gr.Row():
+                generate_btn = gr.Button("🔊 Generate Dubbed Chunk")
                 finalize_btn = gr.Button("✔️ Finalize Chunk", variant="secondary")
+            dubbed_audio = gr.Audio(label="Dubbed Chunk Audio", type="filepath", interactive=False)
+            progress_text = gr.Textbox(label="Progress", interactive=False)
+        with gr.Row(visible=False) as merge_section:
             gr.Markdown("### 🏁 Step 3: Merge Final Audio")
             merge_btn = gr.Button("🚀 Merge All Finalized Chunks", variant="primary")
+        final_output = gr.Textbox(label="🎉 Final Results", interactive=False)
+        output_audio = gr.Audio(label="🔊 Final Dubbed Audio", type="filepath", interactive=False)
         # Connect functions to UI components
         process_btn.click(
             inputs=[audio_input, lang_dropdown],
             outputs=[step1_output, original_audio, transcription_text, translation_text, dubbed_audio, progress_text, edit_section, merge_section]
         )
         prev_btn.click(
             fn=lambda t, tr: navigate_chunk(t, tr, "prev"),
             inputs=[transcription_text, translation_text],
             outputs=[original_audio, transcription_text, translation_text, dubbed_audio, progress_text]
         )
         next_btn.click(
             fn=lambda t, tr: navigate_chunk(t, tr, "next"),
             inputs=[transcription_text, translation_text],
             outputs=[original_audio, transcription_text, translation_text, dubbed_audio, progress_text]
         )
         generate_btn.click(
             fn=generate_dubbed_chunk,
             inputs=[transcription_text, translation_text],
             outputs=[dubbed_audio]
         )
         finalize_btn.click(
             fn=finalize_current_chunk,
             inputs=[],
             outputs=[progress_text]
         )
         merge_btn.click(
             fn=merge_all_chunks,
             inputs=[],
             outputs=[final_output, output_audio]
         )
     return demo
 if __name__ == "__main__":
+    DubIndic_interface = create_DubIndic_interface()
+    if DubIndic_interface:
+        DubIndic_interface.launch(show_error=True, share=False, server_name="0.0.0.0", server_port=7860)
     else:
         logger.error("Failed to create the Gradio interface.")