Edge_TTS_NGHIA_transcript

Running

cnph001 committed on Apr 27

Commit

44c7b6f

verified ·

1 Parent(s): a4e47b1

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -8,7 +8,31 @@ import re  # Import the regular expression module
 from pathlib import Path
 from pydub import AudioSegment
 # Get all available voices
 async def get_voices():
@@ -45,10 +69,8 @@ async def paragraph_to_speech(text, voice, rate, pitch):
                 print(f"Silence.mp3 file found at {SILENCE_PATH} and is inserted")
             else:
                 print(f"Silence.mp3 file NOT FOUND")
-                silent_audio = AudioSegment.silent(duration=1000)
-                with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as tmp_file:
-                     silent_audio.export(tmp_file.name, format="mp3")
-                audio_segments.append(tmp_file.name)
         elif part.strip():
             processed_text = part

 from pathlib import Path
 from pydub import AudioSegment
+def get_silence(duration_ms=1000):  # Write duration_ms of silence to a temp .mp3 and return that file's path
+    # Build a silent segment of the requested length (duration_ms, default 1000) at a 24000 Hz frame rate
+    silent_audio = AudioSegment.silent(
+        duration=duration_ms,
+        frame_rate=24000  # 24kHz sampling rate
+    )
+    # Force the in-memory segment to mono with 4-byte samples before it is exported
+    silent_audio = silent_audio.set_channels(1)  # Mono
+    silent_audio = silent_audio.set_sample_width(4)  # 32-bit (4 bytes per sample)
+    with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as tmp_file:  # delete=False: file stays on disk after close; nothing here removes it
+        # Export to the temp file's path as 48k MP3; `parameters` are extra encoder flags (presumably forwarded to ffmpeg - see pydub docs)
+        silent_audio.export(
+            tmp_file.name,
+            format="mp3",
+            bitrate="48k",
+            parameters=[
+                "-ac", "1",  # Mono
+                "-ar", "24000",  # Sample rate
+                "-sample_fmt", "s32",  # 32-bit samples; NOTE(review): confirm libmp3lame accepts non-planar s32 (it may require s32p)
+                "-codec:a", "libmp3lame"  # MP3 codec
+            ]
+        )
+        return tmp_file.name  # Path string only; the file itself is left for the caller to use and clean up
 # Get all available voices
 async def get_voices():
                 print(f"Silence.mp3 file found at {SILENCE_PATH} and is inserted")
             else:
                 print(f"Silence.mp3 file NOT FOUND")
+                silence_file_path = get_silence(5000)  # Store the returned filename
+                audio_segments.append(silence_file_path)  # Use the stored filename
         elif part.strip():
             processed_text = part