Create README.md
Browse files
README.md
ADDED
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: "transformers.js"
|
3 |
+
base_model: Felladrin/llama2_xs_460M_experimental_evol_instruct
|
4 |
+
---
|
5 |
+
|
6 |
+
INT8 ONNX version of [Felladrin/llama2_xs_460M_experimental_evol_instruct](https://huggingface.co/Felladrin/llama2_xs_460M_experimental_evol_instruct), for use with [Transformers.js](https://huggingface.co/docs/transformers.js).
|
7 |
+
|
8 |
+
### Example usage
|
9 |
+
#### Pipeline API
|
10 |
+
```js
|
11 |
+
import { pipeline } from '@xenova/transformers';
|
12 |
+
|
13 |
+
const generator = await pipeline('text-generation', 'Felladrin/onnx-int8-llama2_xs_460M_experimental_evol_instruct');
|
14 |
+
const output = await generator('Once upon a time,', { add_special_tokens: true, max_new_tokens: 60, repetition_penalty: 1.2});
|
15 |
+
console.log(output);
|
16 |
+
```
|
17 |
+
|
18 |
+
#### Auto Classes
|
19 |
+
```js
|
20 |
+
import { AutoModelForCausalLM, AutoTokenizer } from '@xenova/transformers';
|
21 |
+
|
22 |
+
const model_path = 'Felladrin/onnx-int8-llama2_xs_460M_experimental_evol_instruct';
|
23 |
+
const model = await AutoModelForCausalLM.from_pretrained(model_path);
|
24 |
+
const tokenizer = await AutoTokenizer.from_pretrained(model_path);
|
25 |
+
|
26 |
+
const prompt = 'Once upon a time,';
|
27 |
+
const { input_ids } = tokenizer(prompt);
|
28 |
+
const tokens = await model.generate(input_ids, { max_new_tokens: 60, repetition_penalty: 1.2});
|
29 |
+
console.log(tokenizer.decode(tokens[0], { skip_special_tokens: true }));
|
30 |
+
```
|
31 |
+
|