Update README.md
Browse files
README.md
CHANGED
@@ -16,7 +16,9 @@ from hqq.engine.hf import HQQModelForCausalLM, AutoTokenizer
|
|
16 |
tokenizer = AutoTokenizer.from_pretrained(model_id)
|
17 |
model = HQQModelForCausalLM.from_quantized(model_id)
|
18 |
|
19 |
-
|
|
|
|
|
20 |
|
21 |
#Text Generation
|
22 |
prompt = "<s> [INST] How do I build a car? [/INST] "
|
|
|
16 |
tokenizer = AutoTokenizer.from_pretrained(model_id)
|
17 |
model = HQQModelForCausalLM.from_quantized(model_id)
|
18 |
|
19 |
+
#Optional: select the PYTORCH_COMPILE backend for HQQLinear layers
|
20 |
+
from hqq.core.quantize import *
|
21 |
+
HQQLinear.set_backend(HQQBackend.PYTORCH_COMPILE)
|
22 |
|
23 |
#Text Generation
|
24 |
prompt = "<s> [INST] How do I build a car? [/INST] "
|