Spaces:

Linly-AI
/

Linly-ChatFlow

Runtime error

yuhaofeng-shiba committed on May 12, 2023

Commit

aed5af0

1 Parent(s): 6259eea

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -20,7 +20,7 @@ def init_args():
     args.config_path = './config/llama_7b.json'
     args.spm_model_path = './model_file/tokenizer.model'
     args.batch_size = 1
-    args.seq_length = 256
     args.world_size = 1
     args.use_int8 = True
     args.top_p = 0
@@ -41,6 +41,7 @@ def init_model():
     torch.set_default_tensor_type(torch.FloatTensor)
     model = load_model(model, args.load_model_path)
     model.eval()
     print(torch.cuda.max_memory_allocated() / 1024 ** 3)
     device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

     args.config_path = './config/llama_7b.json'
     args.spm_model_path = './model_file/tokenizer.model'
     args.batch_size = 1
+    args.seq_length = 512
     args.world_size = 1
     args.use_int8 = True
     args.top_p = 0
     torch.set_default_tensor_type(torch.FloatTensor)
     model = load_model(model, args.load_model_path)
     model.eval()
+    print(model)
     print(torch.cuda.max_memory_allocated() / 1024 ** 3)
     device = torch.device("cuda" if torch.cuda.is_available() else "cpu")