bweng committed on
Commit
8571dd7
·
verified ·
1 Parent(s): 5cf3dfe

Upload 5 files

Browse files
Embedding.mlmodelc/analytics/coremldata.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4b2449667626ef30bbcf9aad719b8ad5380aab470e3c3bddf5ece68c101cfd5c
3
  size 243
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d6706436639b53830b4dbe8aaf9c9a843f7f582d63e16f3cb8bb7c6ccd58682
3
  size 243
Embedding.mlmodelc/coremldata.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8af46b5ba390f4e1898446f30c318d19f114410e91bd4e2a30839ad3900e3f12
3
- size 646
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a705bac27d151d9642f37609296042a15602a42253039e0921dc9e75da7e004
3
+ size 704
Embedding.mlmodelc/metadata.json CHANGED
@@ -1,6 +1,6 @@
1
  [
2
  {
3
- "shortDescription" : "pyannote community-1 speaker embedding (10 s WeSpeaker ResNet34, packed audio+weights input, interpolates 589-frame weights to pooling layer size internally)",
4
  "metadataOutputVersion" : "3.0",
5
  "outputSchema" : [
6
  {
@@ -20,33 +20,26 @@
20
  ],
21
  "author" : "Fluid Inference",
22
  "specificationVersion" : 8,
23
- "storagePrecision" : "Mixed (Float32, Int8)",
24
  "license" : "CC-BY-4.0",
25
  "mlProgramOperationTypeHistogram" : {
26
- "Ios16.reduceL2Norm" : 1,
27
- "Ios17.reshape" : 6,
28
- "Ios16.reduceMean" : 2,
29
- "Ios17.transpose" : 2,
30
- "Ios17.expandDims" : 10,
31
- "Ios17.add" : 20,
32
- "Ios17.sliceByIndex" : 3,
33
- "Ios16.reduceSum" : 4,
34
- "Ios17.squeeze" : 5,
35
- "Ios17.gather" : 2,
36
- "Pad" : 2,
37
- "Ios17.log" : 1,
38
- "Ios16.constexprAffineDequantize" : 40,
39
  "Ios17.sqrt" : 1,
40
- "Ios17.sub" : 5,
41
- "Ios17.conv" : 41,
42
- "Ios17.clip" : 3,
43
- "Ios16.relu" : 33,
44
- "Ios17.pow" : 2,
45
- "Ios17.realDiv" : 4,
46
  "Ios17.concat" : 1,
47
- "Ios17.mul" : 9
 
 
 
 
 
 
 
 
 
48
  },
49
- "computePrecision" : "Mixed (Float32, Int32)",
50
  "stateSchema" : [
51
 
52
  ],
@@ -67,22 +60,34 @@
67
  "dataType" : "Float32",
68
  "hasShapeFlexibility" : "1",
69
  "isOptional" : "0",
70
- "shapeFlexibility" : "1...32 × 1 × 1 × 160589",
71
- "shapeRange" : "[[1, 32], [1, 1], [1, 1], [160589, 160589]]",
72
- "formattedType" : "MultiArray (Float32 1 × 1 × 1 × 160589)",
 
 
 
 
 
 
 
 
 
 
 
 
73
  "type" : "MultiArray",
74
- "shape" : "[1, 1, 1, 160589]",
75
- "name" : "audio_and_weights",
76
  "shortDescription" : ""
77
  }
78
  ],
79
  "userDefinedMetadata" : {
80
- "com.github.apple.coremltools.conversion_date" : "2025-10-13",
81
  "com.github.apple.coremltools.source" : "torch==2.8.0",
82
  "com.github.apple.coremltools.version" : "9.0b1",
83
  "com.github.apple.coremltools.source_dialect" : "TorchScript"
84
  },
85
- "generatedClassName" : "embedding_community_1_int8_per_channel",
86
  "method" : "predict"
87
  }
88
  ]
 
1
  [
2
  {
3
+ "shortDescription" : "pyannote community-1 speaker embedding backend (WeSpeaker ResNet34 consuming 80×998 FBANK features + 589-frame weights, interpolates weights to 125-frame pooling layer internally)",
4
  "metadataOutputVersion" : "3.0",
5
  "outputSchema" : [
6
  {
 
20
  ],
21
  "author" : "Fluid Inference",
22
  "specificationVersion" : 8,
23
+ "storagePrecision" : "Float16",
24
  "license" : "CC-BY-4.0",
25
  "mlProgramOperationTypeHistogram" : {
26
+ "Ios17.mul" : 4,
 
 
 
 
 
 
 
 
 
 
 
 
27
  "Ios17.sqrt" : 1,
28
+ "Ios17.sub" : 2,
29
+ "Ios17.conv" : 38,
 
 
 
 
30
  "Ios17.concat" : 1,
31
+ "Ios17.clip" : 2,
32
+ "Ios17.add" : 18,
33
+ "Ios17.realDiv" : 4,
34
+ "Ios16.relu" : 33,
35
+ "Ios17.expandDims" : 7,
36
+ "Ios16.reduceSum" : 4,
37
+ "Ios16.reduceL2Norm" : 1,
38
+ "Ios17.squeeze" : 2,
39
+ "Ios17.reshape" : 2,
40
+ "Ios17.cast" : 5
41
  },
42
+ "computePrecision" : "Mixed (Float16, Float32, Int32)",
43
  "stateSchema" : [
44
 
45
  ],
 
60
  "dataType" : "Float32",
61
  "hasShapeFlexibility" : "1",
62
  "isOptional" : "0",
63
+ "shapeFlexibility" : "1...32 × 1 × 80 × 998",
64
+ "shapeRange" : "[[1, 32], [1, 1], [80, 80], [998, 998]]",
65
+ "formattedType" : "MultiArray (Float32 1 × 1 × 80 × 998)",
66
+ "type" : "MultiArray",
67
+ "shape" : "[1, 1, 80, 998]",
68
+ "name" : "fbank_features",
69
+ "shortDescription" : ""
70
+ },
71
+ {
72
+ "dataType" : "Float32",
73
+ "hasShapeFlexibility" : "1",
74
+ "isOptional" : "0",
75
+ "shapeFlexibility" : "1...32 × 589",
76
+ "shapeRange" : "[[1, 32], [589, 589]]",
77
+ "formattedType" : "MultiArray (Float32 1 × 589)",
78
  "type" : "MultiArray",
79
+ "shape" : "[1, 589]",
80
+ "name" : "weights",
81
  "shortDescription" : ""
82
  }
83
  ],
84
  "userDefinedMetadata" : {
85
+ "com.github.apple.coremltools.conversion_date" : "2025-10-16",
86
  "com.github.apple.coremltools.source" : "torch==2.8.0",
87
  "com.github.apple.coremltools.version" : "9.0b1",
88
  "com.github.apple.coremltools.source_dialect" : "TorchScript"
89
  },
90
+ "generatedClassName" : "embedding_community_1",
91
  "method" : "predict"
92
  }
93
  ]
Embedding.mlmodelc/model.mil CHANGED
The diff for this file is too large to render. See raw diff
 
Embedding.mlmodelc/weights/weight.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9ffc18432c23faf3d6b233c85e859876b3aaf0f1557cd4432bb24b8881eddecc
3
- size 7124224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99356b2985b8d43880a657024d941d450b38820451ccff903f76ed4e52d1868b
3
+ size 13412288