Spaces:
				
			
			
	
			
			
		Runtime error
		
	
	
	
			
			
	
	
	
	
		
		
		Runtime error
		
	
		Musa
		
	committed on
		
		
					Commit 
							
							·
						
						27ccf6a
	
1
								Parent(s):
							
							d12d70f
								
Update app.py
Browse files
    	
        app.py
    CHANGED
    
    | @@ -19,6 +19,10 @@ config = Config() | |
| 19 | 
             
            logging.getLogger("numba").setLevel(logging.WARNING)
         | 
| 20 | 
             
            limitation = os.getenv("SYSTEM") == "spaces"  # limit audio length in huggingface spaces
         | 
| 21 |  | 
|  | |
|  | |
|  | |
|  | |
| 22 | 
             
            def create_vc_fn(tgt_sr, net_g, vc, if_f0, file_index):
         | 
| 23 | 
             
                def vc_fn(
         | 
| 24 | 
             
                    input_audio,
         | 
| @@ -74,20 +78,6 @@ def create_vc_fn(tgt_sr, net_g, vc, if_f0, file_index): | |
| 74 | 
             
                        return info, (None, None)
         | 
| 75 | 
             
                return vc_fn
         | 
| 76 |  | 
| 77 | 
            -
            def load_hubert():
         | 
| 78 | 
            -
                global hubert_model
         | 
| 79 | 
            -
                models, _, _ = checkpoint_utils.load_model_ensemble_and_task(
         | 
| 80 | 
            -
                    ["hubert_base.pt"],
         | 
| 81 | 
            -
                    suffix="",
         | 
| 82 | 
            -
                )
         | 
| 83 | 
            -
                hubert_model = models[0]
         | 
| 84 | 
            -
                hubert_model = hubert_model.to(config.device)
         | 
| 85 | 
            -
                if config.is_half:
         | 
| 86 | 
            -
                    hubert_model = hubert_model.half()
         | 
| 87 | 
            -
                else:
         | 
| 88 | 
            -
                    hubert_model = hubert_model.float()
         | 
| 89 | 
            -
                hubert_model.eval()
         | 
| 90 | 
            -
             | 
| 91 | 
             
            def change_to_tts_mode(tts_mode):
         | 
| 92 | 
             
                if tts_mode:
         | 
| 93 | 
             
                    return gr.Audio.update(visible=False), gr.Textbox.update(visible=True), gr.Dropdown.update(visible=True)
         | 
| @@ -97,8 +87,12 @@ def change_to_tts_mode(tts_mode): | |
| 97 | 
             
            if __name__ == '__main__':
         | 
| 98 | 
             
                load_hubert()
         | 
| 99 | 
             
                models = []
         | 
|  | |
| 100 | 
             
                tts_voice_list = asyncio.get_event_loop().run_until_complete(edge_tts.list_voices())
         | 
| 101 | 
             
                voices = [f"{v['ShortName']}-{v['Gender']}" for v in tts_voice_list]
         | 
|  | |
|  | |
|  | |
| 102 | 
             
                if limitation:
         | 
| 103 | 
             
                    with open("weights/model_info.json", "r", encoding="utf-8") as f:
         | 
| 104 | 
             
                        models_info = json.load(f)
         | 
|  | |
| 19 | 
             
            logging.getLogger("numba").setLevel(logging.WARNING)
         | 
| 20 | 
             
            limitation = os.getenv("SYSTEM") == "spaces"  # limit audio length in huggingface spaces
         | 
| 21 |  | 
| 22 | 
            +
            # Load the whisper_large_v2 interface
         | 
| 23 | 
            +
            whisper_interface = gr.Interface.load("models/openai/whisper-large-v2")
         | 
| 24 | 
            +
             | 
| 25 | 
            +
             | 
| 26 | 
             
            def create_vc_fn(tgt_sr, net_g, vc, if_f0, file_index):
         | 
| 27 | 
             
                def vc_fn(
         | 
| 28 | 
             
                    input_audio,
         | 
|  | |
| 78 | 
             
                        return info, (None, None)
         | 
| 79 | 
             
                return vc_fn
         | 
| 80 |  | 
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
| 81 | 
             
            def change_to_tts_mode(tts_mode):
         | 
| 82 | 
             
                if tts_mode:
         | 
| 83 | 
             
                    return gr.Audio.update(visible=False), gr.Textbox.update(visible=True), gr.Dropdown.update(visible=True)
         | 
|  | |
| 87 | 
             
            if __name__ == '__main__':
         | 
| 88 | 
             
                load_hubert()
         | 
| 89 | 
             
                models = []
         | 
| 90 | 
            +
             | 
| 91 | 
             
                tts_voice_list = asyncio.get_event_loop().run_until_complete(edge_tts.list_voices())
         | 
| 92 | 
             
                voices = [f"{v['ShortName']}-{v['Gender']}" for v in tts_voice_list]
         | 
| 93 | 
            +
             | 
| 94 | 
            +
                # Add the whisper_large_v2 model to the models list
         | 
| 95 | 
            +
                models.append(("Whisper v2", "Whisper v2", "OpenAI", None, whisper_interface))
         | 
| 96 | 
             
                if limitation:
         | 
| 97 | 
             
                    with open("weights/model_info.json", "r", encoding="utf-8") as f:
         | 
| 98 | 
             
                        models_info = json.load(f)
         | 
 
			
