Upload optimized ONNX model
Browse files
- config.json +0 -3
- onnx/model_fp16.onnx +2 -2
- onnx/model_q4f16.onnx +2 -2
config.json
CHANGED
@@ -30,11 +30,8 @@
|
|
30 |
"use_gated_mlp": false,
|
31 |
"value_bias": true,
|
32 |
"transformers.js_config": {
|
33 |
-
"dtype": "fp32",
|
34 |
"use_external_data_format": {
|
35 |
-
"model.onnx": 1,
|
36 |
"model_fp16.onnx": 1,
|
37 |
-
"model_q4.onnx": 1,
|
38 |
"model_q4f16.onnx": 1
|
39 |
}
|
40 |
}
|
|
|
30 |
"use_gated_mlp": false,
|
31 |
"value_bias": true,
|
32 |
"transformers.js_config": {
|
|
|
33 |
"use_external_data_format": {
|
|
|
34 |
"model_fp16.onnx": 1,
|
|
|
35 |
"model_q4f16.onnx": 1
|
36 |
}
|
37 |
}
|
onnx/model_fp16.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68c469fbb716f9e146f6c751b34eec034ca776ffad0b5bc5c252f01a2f8291d2
|
3 |
+
size 262860
|
onnx/model_q4f16.onnx
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e17695c4a1d7e20c21e0e76ba9a9b0575c8c8d336f83fb403c44a731e4bcf15d
|
3 |
+
size 288141
|