import gradio as gr
# ุชุนุฑูŠู ุงู„ู†ู…ุงุฐุฌ
models = {
"Whisper Small": "openai/whisper-small.en",
"Wav2Vec2": "facebook/wav2vec2-base-960h"
}
# Load a callable demo for each model from the Hugging Face Inference API.
# (gr.Interface.load is deprecated; gr.load is the current equivalent and
# accepts the same "huggingface/" source prefix.)
whisper = gr.load(f"huggingface/{models['Whisper Small']}")
wav2vec = gr.load(f"huggingface/{models['Wav2Vec2']}")
# Transcribe an audio file with both models and return both results
def transcribe_with_all(audio_path):
    whisper_result = whisper(audio_path)
    wav2vec_result = wav2vec(audio_path)
    return whisper_result, wav2vec_result
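# Optional: a minimal sketch of a local-inference fallback, useful if the
# hosted Inference API rate-limits requests. This is an assumption, not part
# of the original app; it requires the `transformers` and `torch` packages.
#
# from transformers import pipeline
# asr_whisper = pipeline("automatic-speech-recognition", model=models["Whisper Small"])
# asr_wav2vec = pipeline("automatic-speech-recognition", model=models["Wav2Vec2"])
#
# def transcribe_locally(audio_path):
#     # Each pipeline call returns a dict with a "text" field
#     return asr_whisper(audio_path)["text"], asr_wav2vec(audio_path)["text"]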
# Side-by-side comparison UI built with Gradio Blocks
with gr.Blocks() as demo:
    gr.Markdown("# 🗣️ Speech Recognition Model Comparison")
    gr.Markdown("Compare the speech-to-text output of two different models")
    audio_input = gr.Audio(type="filepath", label="🎧 Upload an audio file")
    transcribe_btn = gr.Button("🔍 Transcribe")
    with gr.Row():
        with gr.Column():
            gr.Markdown("### Whisper Small (OpenAI)")
            whisper_output = gr.Textbox(label="Transcription from Whisper")
        with gr.Column():
            gr.Markdown("### Wav2Vec2 (Facebook)")
            wav2vec_output = gr.Textbox(label="Transcription from Wav2Vec2")
    # Wire the button to run both models on the uploaded audio
    transcribe_btn.click(
        fn=transcribe_with_all,
        inputs=audio_input,
        outputs=[whisper_output, wav2vec_output],
    )
# Launch the app
demo.launch()
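# Run locally with `python app.py`; Gradio serves the UI at
# http://localhost:7860 by default. On Hugging Face Spaces the app
# starts automatically when app.py is executed.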