Spaces:

Tamiloneto8
/

Oneto8-test

Sleeping

App Files Files Community

Tamiloneto8 committed on Jul 30

Commit

1b65561

verified ·

1 Parent(s): 274120f

Update app.py

Browse files

Files changed (1) hide show

app.py +80 -17

app.py CHANGED Viewed

@@ -37,7 +37,7 @@ def create_DubIndic_interface():
         if not audio_file or not target_language:
             return (
                 "Please provide both an audio file and a target language.",
-                None, "", "", None, "", None,
                 gr.update(visible=False), gr.update(visible=False)
             )
         try:
@@ -48,20 +48,24 @@ def create_DubIndic_interface():
                 api_name="/process_audio_pipeline_step1"
             )
             logger.info("Received result from step 1: %s", result)
             # [status, internal_val, orig_audio, trans, transl, dubbed_audio, progress]
             return (
-                result[0], result[2], result[3], result[4], result[5], result[6], result[2],
-                gr.update(visible=True), gr.update(visible=True)
             )
         except Exception as e:
             logger.error("Error in start_processing: %s", e, exc_info=True)
             return (
                 f"Error starting the process: {e}",
-                None, "", "", None, "", None,
                 gr.update(visible=False), gr.update(visible=False)
             )
     def navigate_chunk(transcription, translation, direction):
         api_to_call = "/lambda" if direction == "prev" else "/lambda_1"
         try:
             logger.info("Calling %s to navigate.", api_to_call)
@@ -70,11 +74,13 @@ def create_DubIndic_interface():
                 tr=translation,
                 api_name=api_to_call
             )
             # [internal_val, orig_audio, trans, transl, dubbed_audio, progress]
-            return result[1], result[2], result[3], result[4], result[5], result[1]
         except Exception as e:
             logger.error("Error navigating chunks: %s", e, exc_info=True)
-            return None, f"Error navigating chunks: {e}", "", None, "", None
     def generate_dubbed_chunk(transcription, translation):
         if not transcription and not translation:
@@ -86,6 +92,7 @@ def create_DubIndic_interface():
                 translation=translation,
                 api_name="/generate_dubbed_chunk"
             )
             return dubbed_path
         except Exception as e:
             logger.error("Error generating dubbed chunk: %s", e, exc_info=True)
@@ -93,7 +100,9 @@ def create_DubIndic_interface():
     def finalize_current_chunk():
         try:
             progress = client.predict(api_name="/finalize_current_chunk")
             return progress
         except Exception as e:
             logger.error("Error finalizing chunk: %s", e, exc_info=True)
@@ -101,12 +110,15 @@ def create_DubIndic_interface():
     def merge_all_chunks():
         """Call the remote ``/merge_audio_files`` endpoint and return its result.

         Returns:
             A ``(status, audio)`` pair. On success these are the two values
             unpacked from ``client.predict``; on any exception the pair is an
             error message string and ``None``.
         """
         # NOTE(review): `client` and `logger` come from an enclosing scope not
         # visible here -- presumably a gradio_client Client; confirm.
         try:
             # The endpoint takes no inputs. The two-name unpacking raises if the
             # response does not contain exactly two items, and that error is
             # handled by the except branch below as well.
             final_status, final_audio = client.predict(api_name="/merge_audio_files")
             return final_status, final_audio
         except Exception as e:
             # Log with the traceback, then return a value pair instead of
             # re-raising, so the caller always receives two outputs.
             logger.error("Error merging audio files: %s", e, exc_info=True)
             return f"Error merging audio: {e}", None
     custom_theme = gr_themes.Soft(
         primary_hue="orange",
         secondary_hue="red",
@@ -115,11 +127,57 @@ def create_DubIndic_interface():
         button_primary_background_fill="linear-gradient(45deg, #f97316, #ef4444)",
         button_primary_background_fill_hover="linear-gradient(45deg, #ea580c, #dc2626)",
         button_primary_text_color="white",
     )
-    with gr.Blocks(theme=custom_theme, title="DubIndic - AI Audio Dubbing") as demo:
         gr.Markdown("# 🎬 DubIndic - AI Audio Dubbing Pipeline")
         with gr.Row():
             with gr.Column(scale=1):
                 gr.Markdown("### 📤 Step 1: Upload & Configure")
@@ -129,16 +187,15 @@ def create_DubIndic_interface():
                     label="🌐 Target Language"
                 )
                 process_btn = gr.Button("🎯 Start Processing", variant="primary")
         step1_output = gr.Textbox(label="📊 Processing Status", interactive=False)
         with gr.Column(visible=False) as edit_section:
             gr.Markdown("### ✏️ Step 2: Edit, Generate & Finalize Chunks")
             with gr.Row():
                 prev_btn = gr.Button("◀️ Previous")
                 next_btn = gr.Button("Next ▶️")
             original_audio = gr.Audio(label="Original Chunk Audio", type="filepath", interactive=False)
-            download_original = gr.DownloadButton(label="💾 Download Original Chunk", file=None)
             transcription_text = gr.Textbox(label="Transcription (edit if needed)", lines=2, interactive=True)
             translation_text = gr.Textbox(label="Translation (edit if needed)", lines=2, interactive=True)
             with gr.Row():
@@ -146,11 +203,11 @@ def create_DubIndic_interface():
                 finalize_btn = gr.Button("✔️ Finalize Chunk", variant="secondary")
             dubbed_audio = gr.Audio(label="Dubbed Chunk Audio", type="filepath", interactive=False)
             progress_text = gr.Textbox(label="Progress", interactive=False)
         with gr.Row(visible=False) as merge_section:
             gr.Markdown("### 🏁 Step 3: Merge Final Audio")
             merge_btn = gr.Button("🚀 Merge All Finalized Chunks", variant="primary")
         final_output = gr.Textbox(label="🎉 Final Results", interactive=False)
         output_audio = gr.Audio(label="🔊 Final Dubbed Audio", type="filepath", interactive=False)
@@ -158,33 +215,39 @@ def create_DubIndic_interface():
         process_btn.click(
             fn=start_processing,
             inputs=[audio_input, lang_dropdown],
-            outputs=[step1_output, original_audio, transcription_text, translation_text, dubbed_audio, progress_text, download_original, edit_section, merge_section]
         )
         prev_btn.click(
             fn=lambda t, tr: navigate_chunk(t, tr, "prev"),
             inputs=[transcription_text, translation_text],
-            outputs=[original_audio, transcription_text, translation_text, dubbed_audio, progress_text, download_original]
         )
         next_btn.click(
             fn=lambda t, tr: navigate_chunk(t, tr, "next"),
             inputs=[transcription_text, translation_text],
-            outputs=[original_audio, transcription_text, translation_text, dubbed_audio, progress_text, download_original]
         )
         generate_btn.click(
             fn=generate_dubbed_chunk,
             inputs=[transcription_text, translation_text],
             outputs=[dubbed_audio]
         )
         finalize_btn.click(
             fn=finalize_current_chunk,
             inputs=[],
             outputs=[progress_text]
         )
         merge_btn.click(
             fn=merge_all_chunks,
             inputs=[],
             outputs=[final_output, output_audio]
         )
     return demo
 if __name__ == "__main__":
@@ -192,4 +255,4 @@ if __name__ == "__main__":
     if DubIndic_interface:
         DubIndic_interface.launch(show_error=True, share=False, server_name="0.0.0.0", server_port=7860)
     else:
-        logger.error("Failed to create the Gradio interface.")

         if not audio_file or not target_language:
             return (
                 "Please provide both an audio file and a target language.",
+                None, "", "", None, "",
                 gr.update(visible=False), gr.update(visible=False)
             )
         try:
                 api_name="/process_audio_pipeline_step1"
             )
             logger.info("Received result from step 1: %s", result)
+            # API returns a 7-element tuple, we map it to our UI outputs
             # [status, internal_val, orig_audio, trans, transl, dubbed_audio, progress]
             return (
+                result[0], result[2], result[3], result[4], result[5], result[6],
+                gr.update(visible=True), gr.update(visible=True) # Make edit and merge sections visible
             )
         except Exception as e:
             logger.error("Error in start_processing: %s", e, exc_info=True)
             return (
                 f"Error starting the process: {e}",
+                None, "", "", None, "",
                 gr.update(visible=False), gr.update(visible=False)
             )
     def navigate_chunk(transcription, translation, direction):
+        # The API uses different endpoints for next/previous navigation
+        # We assume /lambda is for previous and /lambda_1 is for next
         api_to_call = "/lambda" if direction == "prev" else "/lambda_1"
         try:
             logger.info("Calling %s to navigate.", api_to_call)
                 tr=translation,
                 api_name=api_to_call
             )
+            logger.info("Received result from navigation: %s", result)
+            # API returns a 6-element tuple
             # [internal_val, orig_audio, trans, transl, dubbed_audio, progress]
+            return result[1], result[2], result[3], result[4], result[5]
         except Exception as e:
             logger.error("Error navigating chunks: %s", e, exc_info=True)
+            return None, f"Error navigating chunks: {e}", "", None, ""
     def generate_dubbed_chunk(transcription, translation):
         if not transcription and not translation:
                 translation=translation,
                 api_name="/generate_dubbed_chunk"
             )
+            logger.info("Received dubbed chunk: %s", dubbed_path)
             return dubbed_path
         except Exception as e:
             logger.error("Error generating dubbed chunk: %s", e, exc_info=True)
     def finalize_current_chunk():
         try:
+            logger.info("Calling /finalize_current_chunk.")
             progress = client.predict(api_name="/finalize_current_chunk")
+            logger.info("Received finalization progress: %s", progress)
             return progress
         except Exception as e:
             logger.error("Error finalizing chunk: %s", e, exc_info=True)
     def merge_all_chunks():
         try:
+            logger.info("Calling /merge_audio_files.")
             final_status, final_audio = client.predict(api_name="/merge_audio_files")
+            logger.info("Received final merged audio.")
             return final_status, final_audio
         except Exception as e:
             logger.error("Error merging audio files: %s", e, exc_info=True)
             return f"Error merging audio: {e}", None
+    # Create custom theme with orange-red gradient colors
     custom_theme = gr_themes.Soft(
         primary_hue="orange",
         secondary_hue="red",
         button_primary_background_fill="linear-gradient(45deg, #f97316, #ef4444)",
         button_primary_background_fill_hover="linear-gradient(45deg, #ea580c, #dc2626)",
         button_primary_text_color="white",
+        block_background_fill="rgba(255, 255, 255, 0.05)",
+        block_border_color="rgba(249, 115, 22, 0.2)",
+        input_background_fill="rgba(255, 255, 255, 0.9)",
+        input_border_color="rgba(249, 115, 22, 0.3)",
+        input_border_color_focus="rgba(239, 68, 68, 0.6)"
     )
+    # Define the Gradio Interface using Blocks for a custom layout
+    with gr.Blocks(theme=custom_theme, title="DubIndic - AI Audio Dubbing", css="""
+        .gradio-container {
+            background: linear-gradient(135deg, rgba(249, 115, 22, 0.1), rgba(239, 68, 68, 0.1));
+        }
+        .gr-button[variant="primary"] {
+            background: linear-gradient(45deg, #f97316, #ef4444) !important;
+            border: none !important;
+            color: white !important;
+            font-weight: bold !important;
+        }
+        .gr-button[variant="primary"]:hover {
+            background: linear-gradient(45deg, #ea580c, #dc2626) !important;
+            transform: translateY(-1px);
+            box-shadow: 0 4px 8px rgba(239, 68, 68, 0.3);
+        }
+        .gr-button[variant="secondary"] {
+            background: linear-gradient(45deg, rgba(249, 115, 22, 0.1), rgba(239, 68, 68, 0.1)) !important;
+            border: 2px solid #f97316 !important;
+            color: #f97316 !important;
+            font-weight: bold !important;
+        }
+        .gr-button[variant="secondary"]:hover {
+            background: linear-gradient(45deg, #f97316, #ef4444) !important;
+            color: white !important;
+        }
+        h1 {
+            background: linear-gradient(45deg, #f97316, #ef4444);
+            -webkit-background-clip: text;
+            -webkit-text-fill-color: transparent;
+            background-clip: text;
+            font-weight: bold;
+        }
+        .gr-textbox {
+            border: 2px solid rgba(249, 115, 22, 0.3) !important;
+        }
+        .gr-textbox:focus {
+            border-color: #ef4444 !important;
+            box-shadow: 0 0 0 3px rgba(239, 68, 68, 0.1) !important;
+        }
+    """) as demo:
         gr.Markdown("# 🎬 DubIndic - AI Audio Dubbing Pipeline")
+        gr.Markdown("Transform your audio into another Indian language with full editing control.")
         with gr.Row():
             with gr.Column(scale=1):
                 gr.Markdown("### 📤 Step 1: Upload & Configure")
                     label="🌐 Target Language"
                 )
                 process_btn = gr.Button("🎯 Start Processing", variant="primary")
         step1_output = gr.Textbox(label="📊 Processing Status", interactive=False)
         with gr.Column(visible=False) as edit_section:
             gr.Markdown("### ✏️ Step 2: Edit, Generate & Finalize Chunks")
             with gr.Row():
                 prev_btn = gr.Button("◀️ Previous")
                 next_btn = gr.Button("Next ▶️")
             original_audio = gr.Audio(label="Original Chunk Audio", type="filepath", interactive=False)
             transcription_text = gr.Textbox(label="Transcription (edit if needed)", lines=2, interactive=True)
             translation_text = gr.Textbox(label="Translation (edit if needed)", lines=2, interactive=True)
             with gr.Row():
                 finalize_btn = gr.Button("✔️ Finalize Chunk", variant="secondary")
             dubbed_audio = gr.Audio(label="Dubbed Chunk Audio", type="filepath", interactive=False)
             progress_text = gr.Textbox(label="Progress", interactive=False)
         with gr.Row(visible=False) as merge_section:
             gr.Markdown("### 🏁 Step 3: Merge Final Audio")
             merge_btn = gr.Button("🚀 Merge All Finalized Chunks", variant="primary")
         final_output = gr.Textbox(label="🎉 Final Results", interactive=False)
         output_audio = gr.Audio(label="🔊 Final Dubbed Audio", type="filepath", interactive=False)
         process_btn.click(
             fn=start_processing,
             inputs=[audio_input, lang_dropdown],
+            outputs=[step1_output, original_audio, transcription_text, translation_text, dubbed_audio, progress_text, edit_section, merge_section]
         )
         prev_btn.click(
             fn=lambda t, tr: navigate_chunk(t, tr, "prev"),
             inputs=[transcription_text, translation_text],
+            outputs=[original_audio, transcription_text, translation_text, dubbed_audio, progress_text]
         )
         next_btn.click(
             fn=lambda t, tr: navigate_chunk(t, tr, "next"),
             inputs=[transcription_text, translation_text],
+            outputs=[original_audio, transcription_text, translation_text, dubbed_audio, progress_text]
         )
         generate_btn.click(
             fn=generate_dubbed_chunk,
             inputs=[transcription_text, translation_text],
             outputs=[dubbed_audio]
         )
         finalize_btn.click(
             fn=finalize_current_chunk,
             inputs=[],
             outputs=[progress_text]
         )
         merge_btn.click(
             fn=merge_all_chunks,
             inputs=[],
             outputs=[final_output, output_audio]
         )
     return demo
 if __name__ == "__main__":
     if DubIndic_interface:
         DubIndic_interface.launch(show_error=True, share=False, server_name="0.0.0.0", server_port=7860)
     else:
+        logger.error("Failed to create the Gradio interface.")