xnohat committed on
Commit
fda4b89
·
verified ·
1 Parent(s): 55d5c73

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "architectures": [
3
- "SileroVAD"
4
  ],
5
- "model_type": "silero_vad",
6
  "id2label": {
7
  "0": "no_speech",
8
  "1": "speech"
@@ -11,11 +11,8 @@
11
  "no_speech": 0,
12
  "speech": 1
13
  },
 
 
14
  "sampling_rate": 16000,
15
- "threshold": 0.5,
16
- "min_speech_duration_ms": 250,
17
- "min_silence_duration_ms": 100,
18
- "window_size_samples": 512,
19
- "speech_pad_ms": 30,
20
  "transformers_version": "4.30.2"
21
  }
 
1
  {
2
  "architectures": [
3
+ "AutoModelForAudioClassification"
4
  ],
5
+ "model_type": "audio-classification",
6
  "id2label": {
7
  "0": "no_speech",
8
  "1": "speech"
 
11
  "no_speech": 0,
12
  "speech": 1
13
  },
14
+ "hidden_size": 768,
15
+ "num_labels": 2,
16
  "sampling_rate": 16000,
 
 
 
 
 
17
  "transformers_version": "4.30.2"
18
  }
onnx_config.json ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_names": ["input"],
3
+ "output_names": ["logits"],
4
+ "dynamic_axes": {
5
+ "input": {
6
+ "0": "batch_size",
7
+ "1": "sequence_length"
8
+ },
9
+ "logits": {
10
+ "0": "batch_size",
11
+ "1": "num_classes"
12
+ }
13
+ },
14
+ "opset_version": 14,
15
+ "supported_backends": ["onnxruntime", "webgl", "wasm"],
16
+ "quantized": false,
17
+ "model_inputs": [
18
+ {
19
+ "name": "input",
20
+ "shape": [1, -1],
21
+ "dtype": "float32"
22
+ }
23
+ ],
24
+ "model_outputs": [
25
+ {
26
+ "name": "logits",
27
+ "shape": [1, 2],
28
+ "dtype": "float32"
29
+ }
30
+ ],
31
+ "pipeline_tag": "audio-classification",
32
+ "metadata": {
33
+ "transformers_version": "4.30.2",
34
+ "framework": "onnx"
35
+ }
36
+ }
preprocessor_config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "feature_extractor_type": "Wav2Vec2FeatureExtractor",
3
  "padding_side": "right",
4
  "sampling_rate": 16000,
5
  "return_attention_mask": true,
 
1
  {
2
+ "feature_extractor_type": "AudioFeatureExtractor",
3
  "padding_side": "right",
4
  "sampling_rate": 16000,
5
  "return_attention_mask": true,
tokenizer_config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name_or_path": "facebook/wav2vec2-base",
3
+ "return_attention_mask": true,
4
+ "do_normalize": true,
5
+ "padding": "max_length",
6
+ "max_length": 16000,
7
+ "sampling_rate": 16000,
8
+ "feature_size": 1,
9
+ "padding_value": 0.0,
10
+ "truncation": true
11
+ }