tiantiaf committed on
Commit
1b122c7
·
verified ·
1 Parent(s): a585e16

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +5 -2
README.md CHANGED
@@ -70,8 +70,11 @@ english_accent_list = [
70
  'South African', 'Southeast Asia', 'South Asia', 'Welsh'
71
  ]
72
 
73
- # Load data, here just zeros as the example, audio data should be 16kHz mono channel
74
- data = torch.zeros([1, 16000]).float().to(device)
 
 
 
75
  logits, embeddings = model(data, return_feature=True)
76
 
77
  # Probability and output
 
70
  'South African', 'Southeast Asia', 'South Asia', 'Welsh'
71
  ]
72
 
73
+ # Load data, here just zeros as the example
74
+ # Our training data filters out audio shorter than 3 seconds (unreliable predictions) and longer than 15 seconds (computational limitation)
75
+ # So you need to trim your audio to a maximum of 15 seconds, sampled at 16kHz, mono channel
76
+ max_audio_length = 15 * 16000
77
+ data = torch.zeros([1, 16000]).float().to(device)[:, :max_audio_length]
78
  logits, embeddings = model(data, return_feature=True)
79
 
80
  # Probability and output