Spaces:

Linly-AI
/

Linly-ChatFlow

Runtime error

yuhaofeng-shiba committed on May 12, 2023

Commit

784d667

•

1 Parent(s): 2598f17

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -20,7 +20,7 @@ def init_args():
     args.config_path = './config/llama_7b.json'
     args.spm_model_path = './model_file/tokenizer.model'
     args.batch_size = 1
-    args.seq_length = 512
     args.world_size = 1
     args.use_int8 = True
     args.top_p = 0
@@ -42,9 +42,6 @@ def init_model():
     model = load_model(model, args.load_model_path)
     model.eval()
-    # for name, parameter in model.named_parameters():
-    #     print(name)
-    #     print(parameter)
     print(torch.cuda.max_memory_allocated() / 1024 ** 3)
     device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
     model.to(device)

     args.config_path = './config/llama_7b.json'
     args.spm_model_path = './model_file/tokenizer.model'
     args.batch_size = 1
+    args.seq_length = 256
     args.world_size = 1
     args.use_int8 = True
     args.top_p = 0
     model = load_model(model, args.load_model_path)
     model.eval()
     print(torch.cuda.max_memory_allocated() / 1024 ** 3)
     device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
     model.to(device)