Spaces:
Runtime error
Runtime error
JenkinsGage
committed on
Commit
•
051be48
1
Parent(s):
7c8f24b
Update app.py
Browse files
app.py
CHANGED
@@ -5,7 +5,7 @@ from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
|
|
5 |
|
6 |
tokenizer = AutoTokenizer.from_pretrained('humarin/chatgpt_paraphraser_on_T5_base', cache_dir='./Models')
|
7 |
model = AutoModelForSeq2SeqLM.from_pretrained('humarin/chatgpt_paraphraser_on_T5_base', cache_dir='./Models')
|
8 |
-
|
9 |
|
10 |
def paraphrase(
|
11 |
text,
|
@@ -25,7 +25,7 @@ def paraphrase(
|
|
25 |
truncation=True,
|
26 |
).input_ids
|
27 |
|
28 |
-
outputs = model.generate(
|
29 |
input_ids, temperature=temperature, repetition_penalty=repetition_penalty,
|
30 |
num_return_sequences=num_return_sequences, no_repeat_ngram_size=no_repeat_ngram_size,
|
31 |
num_beams=num_beams, num_beam_groups=num_beam_groups,
|
|
|
5 |
|
6 |
tokenizer = AutoTokenizer.from_pretrained('humarin/chatgpt_paraphraser_on_T5_base', cache_dir='./Models')
|
7 |
model = AutoModelForSeq2SeqLM.from_pretrained('humarin/chatgpt_paraphraser_on_T5_base', cache_dir='./Models')
|
8 |
+
model_quant = torch.quantization.quantize_dynamic(model, {torch.nn.Linear}, dtype=torch.qint8)
|
9 |
|
10 |
def paraphrase(
|
11 |
text,
|
|
|
25 |
truncation=True,
|
26 |
).input_ids
|
27 |
|
28 |
+
outputs = model_quant.generate(
|
29 |
input_ids, temperature=temperature, repetition_penalty=repetition_penalty,
|
30 |
num_return_sequences=num_return_sequences, no_repeat_ngram_size=no_repeat_ngram_size,
|
31 |
num_beams=num_beams, num_beam_groups=num_beam_groups,
|