lshzhm committed on
Commit
8a95680
·
verified ·
1 Parent(s): 68cfefc

Upload 4 files

Browse files
Files changed (3) hide show
  1. app.py +2 -15
  2. tts.sh +1 -1
  3. v2a.sh +2 -2
app.py CHANGED
@@ -33,19 +33,11 @@ video_to_audio_tab = gr.Interface(
33
  fn=video_to_audio,
34
  description="""
35
  Project page: <a href="https://hkchengrex.com/MMAudio/">https://hkchengrex.com/MMAudio/</a><br>
36
- Code: <a href="https://github.com/hkchengrex/MMAudio">https://github.com/hkchengrex/MMAudio</a><br>
37
- NOTE: It takes longer to process high-resolution videos (>384 px on the shorter side).
38
- Doing so does not improve results.
39
- The model has been trained on 8-second videos. Using much longer or shorter videos will degrade performance. Around 5s~12s should be fine.
40
- """,
41
  inputs=[
42
  gr.Video(),
43
  gr.Text(label='Prompt'),
44
- gr.Text(label='Negative prompt', value='music'),
45
- gr.Number(label='Seed (-1: random)', value=-1, precision=0, minimum=-1),
46
- gr.Number(label='Num steps', value=25, precision=0, minimum=1),
47
- gr.Number(label='Guidance Strength', value=4.5, minimum=1),
48
- gr.Number(label='Duration (sec)', value=8, minimum=1),
49
  ],
50
  outputs='playable_video',
51
  cache_examples=False,
@@ -53,12 +45,7 @@ video_to_audio_tab = gr.Interface(
53
  examples=[
54
  [
55
  'https://huggingface.co/hkchengrex/MMAudio/resolve/main/examples/sora_beach.mp4',
56
- 'waves, seagulls',
57
  '',
58
- 0,
59
- 25,
60
- 4.5,
61
- 10,
62
  ],
63
  ])
64
 
 
33
  fn=video_to_audio,
34
  description="""
35
  Project page: <a href="https://hkchengrex.com/MMAudio/">https://hkchengrex.com/MMAudio/</a><br>
36
+ Code: <a href="https://github.com/acappemin/DeepAudio-V1">https://github.com/acappemin/DeepAudio-V1</a><br>
37
+ """
 
 
 
38
  inputs=[
39
  gr.Video(),
40
  gr.Text(label='Prompt'),
 
 
 
 
 
41
  ],
42
  outputs='playable_video',
43
  cache_examples=False,
 
45
  examples=[
46
  [
47
  'https://huggingface.co/hkchengrex/MMAudio/resolve/main/examples/sora_beach.mp4',
 
48
  '',
 
 
 
 
49
  ],
50
  ])
51
 
tts.sh CHANGED
@@ -1 +1 @@
1
- python ./F5-TTS/src/f5_tts/infer/infer_cli_tts_test.py --output_dir ./tests/outputs_tts/ --start 0 --end 10 --ckpt_file ./F5-TTS/ckpts/v2c/v2c_l44.pt --infer_list ./tests/tts_test.lst
 
1
+ python ./F5-TTS/src/f5_tts/infer/infer_cli_tts_test.py --output_dir ./tests/outputs_tts/ --start 0 --end 10 --ckpt_file ./F5-TTS/ckpts/v2c/v2c_l44.pt --infer_list ./tests/tts_test.lst
v2a.sh CHANGED
@@ -1,2 +1,2 @@
1
- cd ./MMAudio
2
- python ./demo.py --output ../tests/outputs_v2a_l44_test/ --start 0 --end 10 --scp ../tests/test.scp --calc_energy 1
 
1
+ cd ./MMAudio
2
+ python ./demo.py --output ../tests/outputs_v2a_l44_test/ --start 0 --end 10 --scp ../tests/test.scp --calc_energy 1