Spaces:
Running
Running
Upload 4 files
Browse files
app.py
CHANGED
@@ -33,19 +33,11 @@ video_to_audio_tab = gr.Interface(
|
|
33 |
fn=video_to_audio,
|
34 |
description="""
|
35 |
Project page: <a href="https://hkchengrex.com/MMAudio/">https://hkchengrex.com/MMAudio/</a><br>
|
36 |
-
Code: <a href="https://github.com/
|
37 |
-
|
38 |
-
Doing so does not improve results.
|
39 |
-
The model has been trained on 8-second videos. Using much longer or shorter videos will degrade performance. Around 5s~12s should be fine.
|
40 |
-
""",
|
41 |
inputs=[
|
42 |
gr.Video(),
|
43 |
gr.Text(label='Prompt'),
|
44 |
-
gr.Text(label='Negative prompt', value='music'),
|
45 |
-
gr.Number(label='Seed (-1: random)', value=-1, precision=0, minimum=-1),
|
46 |
-
gr.Number(label='Num steps', value=25, precision=0, minimum=1),
|
47 |
-
gr.Number(label='Guidance Strength', value=4.5, minimum=1),
|
48 |
-
gr.Number(label='Duration (sec)', value=8, minimum=1),
|
49 |
],
|
50 |
outputs='playable_video',
|
51 |
cache_examples=False,
|
@@ -53,12 +45,7 @@ video_to_audio_tab = gr.Interface(
|
|
53 |
examples=[
|
54 |
[
|
55 |
'https://huggingface.co/hkchengrex/MMAudio/resolve/main/examples/sora_beach.mp4',
|
56 |
-
'waves, seagulls',
|
57 |
'',
|
58 |
-
0,
|
59 |
-
25,
|
60 |
-
4.5,
|
61 |
-
10,
|
62 |
],
|
63 |
])
|
64 |
|
|
|
33 |
fn=video_to_audio,
|
34 |
description="""
|
35 |
Project page: <a href="https://hkchengrex.com/MMAudio/">https://hkchengrex.com/MMAudio/</a><br>
|
36 |
+
Code: <a href="https://github.com/acappemin/DeepAudio-V1">https://github.com/acappemin/DeepAudio-V1</a><br>
|
37 |
+
"""
|
|
|
|
|
|
|
38 |
inputs=[
|
39 |
gr.Video(),
|
40 |
gr.Text(label='Prompt'),
|
|
|
|
|
|
|
|
|
|
|
41 |
],
|
42 |
outputs='playable_video',
|
43 |
cache_examples=False,
|
|
|
45 |
examples=[
|
46 |
[
|
47 |
'https://huggingface.co/hkchengrex/MMAudio/resolve/main/examples/sora_beach.mp4',
|
|
|
48 |
'',
|
|
|
|
|
|
|
|
|
49 |
],
|
50 |
])
|
51 |
|
tts.sh
CHANGED
@@ -1 +1 @@
|
|
1 |
-
python ./F5-TTS/src/f5_tts/infer/infer_cli_tts_test.py --output_dir ./tests/outputs_tts/ --start 0 --end 10 --ckpt_file ./F5-TTS/ckpts/v2c/v2c_l44.pt --infer_list ./tests/tts_test.lst
|
|
|
1 |
+
python ./F5-TTS/src/f5_tts/infer/infer_cli_tts_test.py --output_dir ./tests/outputs_tts/ --start 0 --end 10 --ckpt_file ./F5-TTS/ckpts/v2c/v2c_l44.pt --infer_list ./tests/tts_test.lst
|
v2a.sh
CHANGED
@@ -1,2 +1,2 @@
|
|
1 |
-
cd ./MMAudio
|
2 |
-
python ./demo.py --output ../tests/outputs_v2a_l44_test/ --start 0 --end 10 --scp ../tests/test.scp --calc_energy 1
|
|
|
1 |
+
cd ./MMAudio
|
2 |
+
python ./demo.py --output ../tests/outputs_v2a_l44_test/ --start 0 --end 10 --scp ../tests/test.scp --calc_energy 1
|