mobinln committed on
Commit
fca7347
1 Parent(s): 8926d1f

change settings

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -4,9 +4,9 @@ from llama_cpp import Llama
4
  model = "Qwen/Qwen2-7B-Instruct-GGUF"
5
  llm = Llama.from_pretrained(
6
  repo_id=model,
7
- filename="qwen2-7b-instruct-q4_k_m.gguf",
8
  verbose=True,
9
- use_mmap=False,
10
  use_mlock=True,
11
  n_threads=2,
12
  n_threads_batch=2,
@@ -39,6 +39,7 @@ def respond(
39
  stream=True,
40
  temperature=temperature,
41
  top_p=top_p,
 
42
  )
43
 
44
  for message in completion:
 
4
  model = "Qwen/Qwen2-7B-Instruct-GGUF"
5
  llm = Llama.from_pretrained(
6
  repo_id=model,
7
+ filename="qwen2-7b-instruct-q4_0.gguf",
8
  verbose=True,
9
+ use_mmap=True,
10
  use_mlock=True,
11
  n_threads=2,
12
  n_threads_batch=2,
 
39
  stream=True,
40
  temperature=temperature,
41
  top_p=top_p,
42
+ echo=False
43
  )
44
 
45
  for message in completion: