Add/update the quantized ONNX model files and README.md for Transformers.js v3 (#4)
Browse files- Add/update the quantized ONNX model files and README.md for Transformers.js v3 (38e389d993107afc513366b35e28ea5f37ab4f09)
Co-authored-by: Yuichiro Tachibana <[email protected]>
- README.md +3 -3
- onnx/decoder_model_bnb4.onnx +3 -0
- onnx/decoder_model_fp16.onnx +3 -0
- onnx/decoder_model_int8.onnx +3 -0
- onnx/decoder_model_merged_bnb4.onnx +3 -0
- onnx/decoder_model_merged_fp16.onnx +2 -2
- onnx/decoder_model_merged_int8.onnx +3 -0
- onnx/decoder_model_merged_q4.onnx +3 -0
- onnx/decoder_model_merged_q4f16.onnx +3 -0
- onnx/decoder_model_merged_uint8.onnx +3 -0
- onnx/decoder_model_q4.onnx +3 -0
- onnx/decoder_model_q4f16.onnx +3 -0
- onnx/decoder_model_uint8.onnx +3 -0
- onnx/decoder_with_past_model_bnb4.onnx +3 -0
- onnx/decoder_with_past_model_fp16.onnx +3 -0
- onnx/decoder_with_past_model_int8.onnx +3 -0
- onnx/decoder_with_past_model_q4.onnx +3 -0
- onnx/decoder_with_past_model_q4f16.onnx +3 -0
- onnx/decoder_with_past_model_uint8.onnx +3 -0
- onnx/encoder_model_bnb4.onnx +3 -0
- onnx/encoder_model_int8.onnx +3 -0
- onnx/encoder_model_q4.onnx +3 -0
- onnx/encoder_model_q4f16.onnx +3 -0
- onnx/encoder_model_uint8.onnx +3 -0
README.md
CHANGED
@@ -9,14 +9,14 @@ https://huggingface.co/facebook/nllb-200-distilled-600M with ONNX weights to be
|
|
9 |
|
10 |
## Usage (Transformers.js)
|
11 |
|
12 |
-
If you haven't already, you can install the [Transformers.js](https://huggingface.co/docs/transformers.js) JavaScript library from [NPM](https://www.npmjs.com/package/@xenova/transformers) using:
|
13 |
```bash
|
14 |
-
npm i @xenova/transformers
|
15 |
```
|
16 |
|
17 |
You can then perform multilingual translation like this:
|
18 |
```js
|
19 |
-
import { pipeline } from '@xenova/transformers';
|
20 |
|
21 |
// Create a translation pipeline
|
22 |
const translator = await pipeline('translation', 'Xenova/nllb-200-distilled-600M');
|
|
|
9 |
|
10 |
## Usage (Transformers.js)
|
11 |
|
12 |
+
If you haven't already, you can install the [Transformers.js](https://huggingface.co/docs/transformers.js) JavaScript library from [NPM](https://www.npmjs.com/package/@huggingface/transformers) using:
|
13 |
```bash
|
14 |
+
npm i @huggingface/transformers
|
15 |
```
|
16 |
|
17 |
You can then perform multilingual translation like this:
|
18 |
```js
|
19 |
+
import { pipeline } from '@huggingface/transformers';
|
20 |
|
21 |
// Create a translation pipeline
|
22 |
const translator = await pipeline('translation', 'Xenova/nllb-200-distilled-600M');
|
onnx/decoder_model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3abedf31204e30205a54a35a016e769066ee80de87478833c726d766d54ea8f0
|
3 |
+
size 1168344350
|
onnx/decoder_model_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca4c8cea6faf3acfec6ac9a8e2dbcb12deb95617e39a3eeeabc575c41e9ed5a6
|
3 |
+
size 930453274
|
onnx/decoder_model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34765d44fe475f81b98efa2f7452bc742f7fdfb6b553af18a23ae6ee5ee92049
|
3 |
+
size 1515755203
|
onnx/decoder_model_merged_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a9b4ee5434115dd1610fa96c3aaec9a4654ee814f9c8c865b5f020211820b61
|
3 |
+
size 1168915076
|
onnx/decoder_model_merged_fp16.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51b0ee4d7bfa43013e48c1858b255b5e17bca112914b122fae3e4178b4000ed4
|
3 |
+
size 931025511
|
onnx/decoder_model_merged_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40e5985f77652809304c8c002fb50e4ecedad457edf2589eef69591574a0782c
|
3 |
+
size 1516432837
|
onnx/decoder_model_merged_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbea01de69bf0f342d67d035bceb7baa3c25b31213c54e4a630a92554684a293
|
3 |
+
size 1181496152
|
onnx/decoder_model_merged_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:edd56698a6779a0b66564db3375c6b7cd3fd584cfda4f54177bb2a8bc46fee19
|
3 |
+
size 641649334
|
onnx/decoder_model_merged_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce477adf6c08c103c5b1d38581d4a28934aeb8c0a4662399ee7c5d05d14bd227
|
3 |
+
size 1516432902
|
onnx/decoder_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4855f26e7e251aff2e9152dd004a0c6e139ba2bd320b0f3d3834b69db5d43b0
|
3 |
+
size 1180926290
|
onnx/decoder_model_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c7c33071a9f719248cd1cb799d3b8d5e07b9c30e84a73e3ab38be53265154a1
|
3 |
+
size 641063897
|
onnx/decoder_model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28c74e11b8453a1ad9657b2525ce564e8e78e30feccb993122f2e15afb14c8b2
|
3 |
+
size 1515755268
|
onnx/decoder_with_past_model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d48e295399d10b1a401f16ab6bf90413e95b6f90b160139c69244de74c787db
|
3 |
+
size 1153955682
|
onnx/decoder_with_past_model_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7cc04c98db49e532dbfa5aa9c8b31e01375faea1a58de89826c3b6ce199669ea
|
3 |
+
size 879951078
|
onnx/decoder_with_past_model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a081e3f9a77e142bb0f01d0b8039530247db4eab4cd894218353e9b755631cd1
|
3 |
+
size 1490336684
|
onnx/decoder_with_past_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8639ee384dc5cb11a9277b748a3859f78cc40095ad565d6ad2722ad1e0824eb4
|
3 |
+
size 1164964950
|
onnx/decoder_with_past_model_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:722f62f1dbb071a4a18540ef2eeb1de174a4b9a43f437e99ec4bfdd54fe7f89f
|
3 |
+
size 626734069
|
onnx/decoder_with_past_model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9f39b5c72875362459124252f82659de428e0818996bfa6400d0c3b96105cf0
|
3 |
+
size 1490336738
|
onnx/encoder_model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0699e77b8f225aa4577c37f9ccda8046d821459eaf4b1ce4e39353d69813de3d
|
3 |
+
size 1139440339
|
onnx/encoder_model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da9234723304e9f76216b67a43ede4fe65393cbf5942a7e4a84595782a4bc161
|
3 |
+
size 415346576
|
onnx/encoder_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad7ead9b72b01c3c86f474dd2a895be224e36799f89b09c8da9d8c2d41603aa6
|
3 |
+
size 1148876935
|
onnx/encoder_model_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46952b3df2924d4db8204a179f183c0c3836cf8af54a224b7b1daa60374e6f57
|
3 |
+
size 612305403
|
onnx/encoder_model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08b857ca2045dc74b39dadc3b18e686d10389d22424d46f85d10010451a83c42
|
3 |
+
size 415346625
|