gxy committed on
Commit
d01da2d
1 Parent(s): 555032a

Update launch.py

Browse files
Files changed (1) hide show
  1. launch.py +1 -1
launch.py CHANGED
@@ -33,7 +33,7 @@ lm_model = LlamaForCausalLM.from_pretrained(
33
  device_map="auto",
34
  torch_dtype=torch.float16,
35
  use_auth_token=AUTH_TOKEN,
36
- quantization_config=BitsAndBytesConfig(load_in_8bit=True))
37
  tokenizer = LlamaTokenizer.from_pretrained(LM_MODEL_PATH, use_auth_token=AUTH_TOKEN)
38
 
39
  # visual model
 
33
  device_map="auto",
34
  torch_dtype=torch.float16,
35
  use_auth_token=AUTH_TOKEN,
36
+ quantization_config=BitsAndBytesConfig(load_in_4bit=True))
37
  tokenizer = LlamaTokenizer.from_pretrained(LM_MODEL_PATH, use_auth_token=AUTH_TOKEN)
38
 
39
  # visual model