yuhaofeng-shiba committed on
Commit
aed5af0
·
1 Parent(s): 6259eea

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -20,7 +20,7 @@ def init_args():
20
  args.config_path = './config/llama_7b.json'
21
  args.spm_model_path = './model_file/tokenizer.model'
22
  args.batch_size = 1
23
- args.seq_length = 256
24
  args.world_size = 1
25
  args.use_int8 = True
26
  args.top_p = 0
@@ -41,6 +41,7 @@ def init_model():
41
  torch.set_default_tensor_type(torch.FloatTensor)
42
  model = load_model(model, args.load_model_path)
43
  model.eval()
 
44
 
45
  print(torch.cuda.max_memory_allocated() / 1024 ** 3)
46
  device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 
20
  args.config_path = './config/llama_7b.json'
21
  args.spm_model_path = './model_file/tokenizer.model'
22
  args.batch_size = 1
23
+ args.seq_length = 512
24
  args.world_size = 1
25
  args.use_int8 = True
26
  args.top_p = 0
 
41
  torch.set_default_tensor_type(torch.FloatTensor)
42
  model = load_model(model, args.load_model_path)
43
  model.eval()
44
+ print(model)
45
 
46
  print(torch.cuda.max_memory_allocated() / 1024 ** 3)
47
  device = torch.device("cuda" if torch.cuda.is_available() else "cpu")