herMaster committed on
Commit
f005fdc
1 Parent(s): 486c196

Handling max_new_tokens errors.

Browse files
Files changed (1) hide show
  1. app.py +4 -1
app.py CHANGED
@@ -41,6 +41,9 @@ llm = AutoModelForCausalLM.from_pretrained("TheBloke/Llama-2-7B-Chat-GGUF",
41
  model_type="llama",
42
  # config = ctransformers.hub.AutoConfig,
43
  # hf = True
 
 
 
44
  )
45
 
46
 
@@ -157,5 +160,5 @@ gr.Interface(
157
  description="This app facilitates a conversation with PDFs available on https://www.delo.si/assets/media/other/20110728/100%20Weird%20Facts%20About%20the%20Human%20Body.pdf💡",
158
  theme="soft",
159
  examples=["Hello", "what is the speed of human nerve impulses?"],
160
- cache_examples=True,
161
  ).launch()
 
41
  model_type="llama",
42
  # config = ctransformers.hub.AutoConfig,
43
  # hf = True
44
+ temperature = 0.2,
45
+ max_new_tokens = 1024,
46
+ stop = ['\n']
47
  )
48
 
49
 
 
160
  description="This app facilitates a conversation with PDFs available on https://www.delo.si/assets/media/other/20110728/100%20Weird%20Facts%20About%20the%20Human%20Body.pdf💡",
161
  theme="soft",
162
  examples=["Hello", "what is the speed of human nerve impulses?"],
163
+ # cache_examples=True,
164
  ).launch()