benchang1110
committed on
Commit
•
0541848
1
Parent(s):
5d73d5d
Update README.md
Browse files
README.md
CHANGED
@@ -26,8 +26,8 @@ def generate_response():
|
|
26 |
message = [
|
27 |
{'content': prompt, 'role': 'user'},
|
28 |
]
|
29 |
-
formatted_chat = tokenizer.apply_chat_template(
|
30 |
-
_ = model.generate(formatted_chat,streamer=streamer,use_cache=True,max_new_tokens=
|
31 |
|
32 |
if __name__ == '__main__':
|
33 |
device = 'cuda' if torch.cuda.is_available() else 'cpu'
|
|
|
26 |
message = [
|
27 |
{'content': prompt, 'role': 'user'},
|
28 |
]
|
29 |
+
formatted_chat = tokenizer.apply_chat_template(message,tokenize=True,add_generation_prompt=True,return_tensors='pt').to(device)
|
30 |
+
_ = model.generate(formatted_chat,streamer=streamer,use_cache=True,max_new_tokens=1024,do_sample=True)
|
31 |
|
32 |
if __name__ == '__main__':
|
33 |
device = 'cuda' if torch.cuda.is_available() else 'cpu'
|