Add/update the quantized ONNX model files and README.md for Transformers.js v3 (#3)
Browse files- Add/update the quantized ONNX model files and README.md for Transformers.js v3 (6e234b76aa96d066ae8ef8f48497291df9464ce4)
Co-authored-by: Yuichiro Tachibana <whitphx@users.noreply.huggingface.co>
- onnx/decoder_model_bnb4.onnx +3 -0
- onnx/decoder_model_fp16.onnx +3 -0
- onnx/decoder_model_int8.onnx +3 -0
- onnx/decoder_model_merged_bnb4.onnx +3 -0
- onnx/decoder_model_merged_fp16.onnx +2 -2
- onnx/decoder_model_merged_int8.onnx +3 -0
- onnx/decoder_model_merged_q4.onnx +3 -0
- onnx/decoder_model_merged_q4f16.onnx +3 -0
- onnx/decoder_model_merged_uint8.onnx +3 -0
- onnx/decoder_model_q4.onnx +3 -0
- onnx/decoder_model_q4f16.onnx +3 -0
- onnx/decoder_model_uint8.onnx +3 -0
- onnx/decoder_with_past_model_bnb4.onnx +3 -0
- onnx/decoder_with_past_model_fp16.onnx +3 -0
- onnx/decoder_with_past_model_int8.onnx +3 -0
- onnx/decoder_with_past_model_q4.onnx +3 -0
- onnx/decoder_with_past_model_q4f16.onnx +3 -0
- onnx/decoder_with_past_model_uint8.onnx +3 -0
- onnx/encoder_model_bnb4.onnx +3 -0
- onnx/encoder_model_int8.onnx +3 -0
- onnx/encoder_model_q4.onnx +3 -0
- onnx/encoder_model_q4f16.onnx +3 -0
- onnx/encoder_model_uint8.onnx +3 -0
onnx/decoder_model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fcb2c85568120ca2a1140bd0fee6f2e91de91d37f4043dc1bf2e8b9d5bb79724
|
3 |
+
size 144643802
|
onnx/decoder_model_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e09d3c1e8cedbf6df8094b2e38ad06370e8439a573c0c2c38c2ecdf1ec8994e8
|
3 |
+
size 115703222
|
onnx/decoder_model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5586116a2be6c6929fbaecf38ccf0ee8dde91ec46ebbee7b7895d826e1265284
|
3 |
+
size 187102282
|
onnx/decoder_model_merged_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:235ec7eb47dde3ded11ce3c77336f22259990d2fe1476b42abbc9658bbf9a58f
|
3 |
+
size 144901491
|
onnx/decoder_model_merged_fp16.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d394d59fb0ff5d032d179d954c12a650c60785c60228586a57e405ff61814d19
|
3 |
+
size 116131279
|
onnx/decoder_model_merged_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e782fb4f915303df4bcbded070eb4fb7cbd2b58103c6d04654e265f6334d4f0e
|
3 |
+
size 58894845
|
onnx/decoder_model_merged_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d823c4f6f5a93436b2a3039f6a88c5d06b2f5bed4c646ccad73586438b94ec9d
|
3 |
+
size 146473443
|
onnx/decoder_model_merged_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86b5e285ecde54b946900e560e61a2be2a64bd79c76b6b49802b8ad744b6a431
|
3 |
+
size 79962830
|
onnx/decoder_model_merged_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1669ad2513a3f08b6370ba6e97d44c490c690efc5ff2e57c2058e71a2e7df1bf
|
3 |
+
size 58894872
|
onnx/decoder_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f74b524de40a6c45e599f3673f8287e24e84068153116a0956d0585949b7a97
|
3 |
+
size 146216186
|
onnx/decoder_model_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce019bec97fefed0cc4c29984d897c8777a8105e618100be0e91f7859175784b
|
3 |
+
size 79536297
|
onnx/decoder_model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:43190b5566c5083e661c8cc405e313a048c8855558722fd363411ba5db7b9dad
|
3 |
+
size 187102309
|
onnx/decoder_with_past_model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3efe47989a90cf66159a711439bf9b18d45a41c2cc5a7a541d6d99cb2e3307fe
|
3 |
+
size 142781030
|
onnx/decoder_with_past_model_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8cb5da70fde687d9610396e7e6262c88b5110bb9101b1851db9c7b752ef0cce
|
3 |
+
size 109337270
|
onnx/decoder_with_past_model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bde78142688a70aefce0ac365de325cc6cc9b6051ed1e6f993957ab98e90952
|
3 |
+
size 183853221
|
onnx/decoder_with_past_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec3e94cf7a66346ee23ed2b217322231e0bf910ace5b8dd856c94bf31ef4709b
|
3 |
+
size 144156902
|
onnx/decoder_with_past_model_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:55a8abde1ef0efbd7c49db4233a319db24439af08873c13809ea06413c88286e
|
3 |
+
size 77690541
|
onnx/decoder_with_past_model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0f448cfcfafe42f4143d659a7cbf9e63ea235d42b767848eedeee13b6979aff
|
3 |
+
size 183853243
|
onnx/encoder_model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca82be2df8f82e53fd3bf4bb209fde353df3353b57cceae8f7e44b070718bc44
|
3 |
+
size 140627901
|
onnx/encoder_model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c95b80aad377b35481f5c828b984c5a05a08c5dc97767bea6d219eb80f982e3c
|
3 |
+
size 51617048
|
onnx/encoder_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30e7fbb9d09b3632fc2f18bebcbc0d309fb1583582bbdebdf1932a274fcf2a28
|
3 |
+
size 141807261
|
onnx/encoder_model_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e7d7d35cae5fbd6580c4511b1a4f96d8bc0c56343bd5abf955c0a0396af1462
|
3 |
+
size 75681825
|
onnx/encoder_model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80097df1f8134385b624984698b6a19ebff6858e3d6549e9ad6c76ce5e64c48f
|
3 |
+
size 51617067
|