ShoufaChen committed on
Commit
b7f8141
1 Parent(s): e61c6be

low memory

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -44,7 +44,7 @@ def load_model(args):
44
  llm = LLM(
45
  args=args,
46
  model='serve/fake_json/{}.json'.format(args.gpt_model),
47
- gpu_memory_utilization=0.6,
48
  skip_tokenizer_init=True)
49
  print(f"gpt model is loaded")
50
  return vq_model, llm, image_size
 
44
  llm = LLM(
45
  args=args,
46
  model='serve/fake_json/{}.json'.format(args.gpt_model),
47
+ gpu_memory_utilization=0.5,
48
  skip_tokenizer_init=True)
49
  print(f"gpt model is loaded")
50
  return vq_model, llm, image_size