pvduy commited on
Commit
53b40bf
1 Parent(s): babdb31

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +8 -10
app.py CHANGED
@@ -54,19 +54,17 @@ def predict(message, history, system_prompt, temperature, max_tokens):
54
  outputs = []
55
  for text in streamer:
56
  outputs.append(text)
57
- stop = False
58
- for tok in stop_tokens:
59
- if tok in text:
60
- stop = True
61
- break
62
- if stop:
63
- yield "".join(outputs)
64
  break
 
 
 
 
65
 
66
  if __name__ == "__main__":
67
  args = parse_args()
68
- tokenizer = AutoTokenizer.from_pretrained("stabilityai/stablelm-2-12b-chat", trust_remote_code=True)
69
- model = AutoModelForCausalLM.from_pretrained("stabilityai/stablelm-2-12b-chat", trust_remote_code=True, torch_dtype=torch.bfloat16)
70
  device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
71
  model = model.to(device)
72
  gr.ChatInterface(
@@ -85,4 +83,4 @@ if __name__ == "__main__":
85
  gr.Slider(100, 2048, 1024, label="Max Tokens"),
86
  ],
87
  additional_inputs_accordion_name="Parameters",
88
- ).queue().launch()
 
54
  outputs = []
55
  for text in streamer:
56
  outputs.append(text)
57
+ if text in stop_tokens:
 
 
 
 
 
 
58
  break
59
+ print(text)
60
+ yield "".join(outputs)
61
+
62
+
63
 
64
  if __name__ == "__main__":
65
  args = parse_args()
66
+ tokenizer = AutoTokenizer.from_pretrained("stabilityai/stablelm-2-chat", trust_remote_code=True)
67
+ model = AutoModelForCausalLM.from_pretrained("stabilityai/stablelm-2-chat", trust_remote_code=True, torch_dtype=torch.bfloat16)
68
  device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
69
  model = model.to(device)
70
  gr.ChatInterface(
 
83
  gr.Slider(100, 2048, 1024, label="Max Tokens"),
84
  ],
85
  additional_inputs_accordion_name="Parameters",
86
+ ).queue().launch()