minhdang committed on
Commit
179b4d7
1 Parent(s): d67e122

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -25,7 +25,8 @@ tokenizer = AutoTokenizer.from_pretrained(model_id)
25
  model = AutoModelForCausalLM.from_pretrained(model_id,
26
  # load_in_8bit=True,
27
  quantization_config=nf4_config,
28
- torch_dtype = torch.bfloat16,
 
29
  device_map="auto"
30
  )
31
 
 
25
  model = AutoModelForCausalLM.from_pretrained(model_id,
26
  # load_in_8bit=True,
27
  quantization_config=nf4_config,
28
+ attn_implementation="flash_attention_2",
29
+ # torch_dtype = torch.bfloat16,
30
  device_map="auto"
31
  )
32