Add/update the quantized ONNX model files and README.md for Transformers.js v3 (#2)
Browse files
- Add/update the quantized ONNX model files and README.md for Transformers.js v3 (b00d6b85e10c0401bf2e6c141a8f531190a56ded)
Co-authored-by: Yuichiro Tachibana <[email protected]>
- README.md +4 -4
- onnx/decoder_model_bnb4.onnx +3 -0
- onnx/decoder_model_int8.onnx +3 -0
- onnx/decoder_model_merged_bnb4.onnx +3 -0
- onnx/decoder_model_merged_fp16.onnx +3 -0
- onnx/decoder_model_merged_int8.onnx +3 -0
- onnx/decoder_model_merged_q4.onnx +3 -0
- onnx/decoder_model_merged_q4f16.onnx +3 -0
- onnx/decoder_model_merged_uint8.onnx +3 -0
- onnx/decoder_model_q4.onnx +3 -0
- onnx/decoder_model_q4f16.onnx +3 -0
- onnx/decoder_model_uint8.onnx +3 -0
- onnx/decoder_with_past_model_bnb4.onnx +3 -0
- onnx/decoder_with_past_model_fp16.onnx +3 -0
- onnx/decoder_with_past_model_int8.onnx +3 -0
- onnx/decoder_with_past_model_q4.onnx +3 -0
- onnx/decoder_with_past_model_q4f16.onnx +3 -0
- onnx/decoder_with_past_model_uint8.onnx +3 -0
README.md
CHANGED
@@ -6,15 +6,15 @@ tags:
|
|
6 |
|
7 |
## Usage (Transformers.js)
|
8 |
|
9 |
-
If you haven't already, you can install the [Transformers.js](https://huggingface.co/docs/transformers.js) JavaScript library from [NPM](https://www.npmjs.com/package/@xenova/transformers) using:
|
10 |
```bash
|
11 |
-
npm i @xenova/transformers
|
12 |
```
|
13 |
|
14 |
You can then use the model to generate text like this:
|
15 |
|
16 |
```js
|
17 |
-
import { pipeline } from "@xenova/transformers";
|
18 |
|
19 |
// Create a text-generation pipeline
|
20 |
const generator = await pipeline('text-generation', 'Xenova/llama2.c-stories110M');
|
@@ -27,4 +27,4 @@ console.log(output);
|
|
27 |
const output2 = await generator(text, { max_new_tokens: 50 });
|
28 |
console.log(output2);
|
29 |
// [{ generated_text: "Once upon a time, there was a little girl named Lily. She loved to play outside in the sunshine. One day, she saw a big, scary dog. She was scared and didn't know what to do. \nSudden" }]
|
30 |
-
```
|
|
|
6 |
|
7 |
## Usage (Transformers.js)
|
8 |
|
9 |
+
If you haven't already, you can install the [Transformers.js](https://huggingface.co/docs/transformers.js) JavaScript library from [NPM](https://www.npmjs.com/package/@huggingface/transformers) using:
|
10 |
```bash
|
11 |
+
npm i @huggingface/transformers
|
12 |
```
|
13 |
|
14 |
You can then use the model to generate text like this:
|
15 |
|
16 |
```js
|
17 |
+
import { pipeline } from "@huggingface/transformers";
|
18 |
|
19 |
// Create a text-generation pipeline
|
20 |
const generator = await pipeline('text-generation', 'Xenova/llama2.c-stories110M');
|
|
|
27 |
const output2 = await generator(text, { max_new_tokens: 50 });
|
28 |
console.log(output2);
|
29 |
// [{ generated_text: "Once upon a time, there was a little girl named Lily. She loved to play outside in the sunshine. One day, she saw a big, scary dog. She was scared and didn't know what to do. \nSudden" }]
|
30 |
+
```
|
onnx/decoder_model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48f3ee2a5a9e550375ef584cdafb7d51fd6afe60920df8b2de5d7c4cfded7209
|
3 |
+
size 146956453
|
onnx/decoder_model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11edd7dbd7d7ed108038f09f95e0e278e2d344316be413d78420c19f6f57c40f
|
3 |
+
size 110465966
|
onnx/decoder_model_merged_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a123e9b6865e4967e4bf85ccb3228be419af2cd8b25429030127e07b2a2bec0
|
3 |
+
size 147314862
|
onnx/decoder_model_merged_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bb63fabda312fa6d89e04371a76a5e014acb0451af4d984d93508f4a1339bda
|
3 |
+
size 219938798
|
onnx/decoder_model_merged_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1fe1f56778f28b8916f076094fb6fccd03c742ff8a8fba43e1cb38f0e09c8730
|
3 |
+
size 110901835
|
onnx/decoder_model_merged_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67fe2925907ee6c0f382d094d41d1bacd7a37d63f00f29b1c5cb8a171d91bfd6
|
3 |
+
size 152621898
|
onnx/decoder_model_merged_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f20fe0429bd4f29caf621eb3e3c46578ab6cf954b7c24127d9bcb0be53d2c5b3
|
3 |
+
size 97868949
|
onnx/decoder_model_merged_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4de80e36618c4b3a6233d48569350cc0f59048f789a8545e251c7d0d9345b0d0
|
3 |
+
size 110901871
|
onnx/decoder_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bf83350acbd3ad454ac72b0649e7952425cd73a300ea387cc28243fae69a39e
|
3 |
+
size 152264245
|
onnx/decoder_model_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42760b046ed0477fd0c3e7db06f52154c13de814e0f9ddce21057c4cf05afc72
|
3 |
+
size 97504456
|
onnx/decoder_model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ab5455480211894bd2a960857493c1613f39b176b0a783c1902011393583a4d
|
3 |
+
size 110466002
|
onnx/decoder_with_past_model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a55d28e1ab4c12776d0c007e76c01ad21064d95cab06db7251710f17f3754d5c
|
3 |
+
size 146935345
|
onnx/decoder_with_past_model_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d0683296baa69d310725576b092d7ba5d28a11524ad73e28f7d81f88746620b
|
3 |
+
size 219568820
|
onnx/decoder_with_past_model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d75c879601bf38baacf1958c4e53eed4857f17e84a0e61144b5312475fb471d
|
3 |
+
size 110444858
|
onnx/decoder_with_past_model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39f69ab4571f779776725768877a36a51ffa9a1054cacbefe6a1d1b60da5ebbe
|
3 |
+
size 152243137
|
onnx/decoder_with_past_model_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5d8d70deb74214e26f2f850b3f22454f4544b58452386b3d2fd11b69ff148d2
|
3 |
+
size 97487799
|
onnx/decoder_with_past_model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:330ba180bf480d771976e8fa035636a60da5892f3d1f663d66cfb1837a7a6bdf
|
3 |
+
size 110444894
|