change settings
Browse files
app.py
CHANGED
@@ -4,9 +4,9 @@ from llama_cpp import Llama
|
|
4 |
model = "Qwen/Qwen2-7B-Instruct-GGUF"
|
5 |
llm = Llama.from_pretrained(
|
6 |
repo_id=model,
|
7 |
-
filename="qwen2-7b-instruct-
|
8 |
verbose=True,
|
9 |
-
use_mmap=
|
10 |
use_mlock=True,
|
11 |
n_threads=2,
|
12 |
n_threads_batch=2,
|
@@ -39,6 +39,7 @@ def respond(
|
|
39 |
stream=True,
|
40 |
temperature=temperature,
|
41 |
top_p=top_p,
|
|
|
42 |
)
|
43 |
|
44 |
for message in completion:
|
|
|
4 |
model = "Qwen/Qwen2-7B-Instruct-GGUF"
|
5 |
llm = Llama.from_pretrained(
|
6 |
repo_id=model,
|
7 |
+
filename="qwen2-7b-instruct-q4_0.gguf",
|
8 |
verbose=True,
|
9 |
+
use_mmap=True,
|
10 |
use_mlock=True,
|
11 |
n_threads=2,
|
12 |
n_threads_batch=2,
|
|
|
39 |
stream=True,
|
40 |
temperature=temperature,
|
41 |
top_p=top_p,
|
42 |
+
echo=False
|
43 |
)
|
44 |
|
45 |
for message in completion:
|