Spaces:

CreitinGameplays
/

ConvAIChat

Paused

CreitinGameplays committed on May 19

Commit

89a382b

•

1 Parent(s): 88185d8

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -10,6 +10,7 @@ import torch
 from transformers import AutoModelForCausalLM, AutoTokenizer, TextIteratorStreamer
 DESCRIPTION = "# ConvAI 9b"
 if not torch.cuda.is_available():
     DESCRIPTION += "\n<p>Running on CPU 🥶 This demo does not work on CPU.</p>"
@@ -20,7 +21,7 @@ MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
 if torch.cuda.is_available():
     model_id = "CreitinGameplays/ConvAI-9b"
-    model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.float16, device_map="auto")
     tokenizer = AutoTokenizer.from_pretrained(model_id)
 @spaces.GPU

 from transformers import AutoModelForCausalLM, AutoTokenizer, TextIteratorStreamer
 DESCRIPTION = "# ConvAI 9b"
+hf_token = os.getenv("hf_token")
 if not torch.cuda.is_available():
     DESCRIPTION += "\n<p>Running on CPU 🥶 This demo does not work on CPU.</p>"
 if torch.cuda.is_available():
     model_id = "CreitinGameplays/ConvAI-9b"
+    model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.float16, device_map="auto", auth_token=hf_token)
     tokenizer = AutoTokenizer.from_pretrained(model_id)
 @spaces.GPU