Spaces: Runtime error
Handling max_new_tokens errors.
Browse files
app.py
CHANGED
@@ -41,6 +41,9 @@ llm = AutoModelForCausalLM.from_pretrained("TheBloke/Llama-2-7B-Chat-GGUF",
|
|
41 |
model_type="llama",
|
42 |
# config = ctransformers.hub.AutoConfig,
|
43 |
# hf = True
|
|
|
|
|
|
|
44 |
)
|
45 |
|
46 |
|
@@ -157,5 +160,5 @@ gr.Interface(
|
|
157 |
description="This app facilitates a conversation with PDFs available on https://www.delo.si/assets/media/other/20110728/100%20Weird%20Facts%20About%20the%20Human%20Body.pdf💡",
|
158 |
theme="soft",
|
159 |
examples=["Hello", "what is the speed of human nerve impulses?"],
|
160 |
-
cache_examples=True,
|
161 |
).launch()
|
|
|
41 |
model_type="llama",
|
42 |
# config = ctransformers.hub.AutoConfig,
|
43 |
# hf = True
|
44 |
+
temperature = 0.2,
|
45 |
+
max_new_tokens = 1024,
|
46 |
+
stop = ['\n']
|
47 |
)
|
48 |
|
49 |
|
|
|
160 |
description="This app facilitates a conversation with PDFs available on https://www.delo.si/assets/media/other/20110728/100%20Weird%20Facts%20About%20the%20Human%20Body.pdf💡",
|
161 |
theme="soft",
|
162 |
examples=["Hello", "what is the speed of human nerve impulses?"],
|
163 |
+
# cache_examples=True,
|
164 |
).launch()
|