Spaces:

Linly-AI
/

Linly-ChatFlow

Runtime error

wmpscc committed on Jul 23, 2023

Commit

a6b7210

1 Parent(s): 3813a21

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -41,7 +41,7 @@ def init_args():
     args = load_hyperparam(args)
     # args.tokenizer = Tokenizer(model_path=args.spm_model_path)
-    args.tokenizer = AutoTokenizer.from_pretrained("Linly-AI/Linly-ChatFlow", use_fast=False, trust_remote_code=True)
     args.vocab_size = args.tokenizer.sp_model.vocab_size()
@@ -57,8 +57,8 @@ def init_model():
     # device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
     # model.to(device)
-    model = AutoModelForCausalLM.from_pretrained("Linly-AI/Linly-ChatFlow", device_map="auto", torch_dtype=torch.float16, trust_remote_code=True)
     print(torch.cuda.max_memory_allocated() / 1024 ** 3)
     lm_generation = LmGeneration(model, args.tokenizer)

     args = load_hyperparam(args)
     # args.tokenizer = Tokenizer(model_path=args.spm_model_path)
+    args.tokenizer = AutoTokenizer.from_pretrained("Linly-AI/Chinese-LLaMA-2-7B-hf", use_fast=False, trust_remote_code=True)
     args.vocab_size = args.tokenizer.sp_model.vocab_size()
     # device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
     # model.to(device)
+    model = AutoModelForCausalLM.from_pretrained("Linly-AI/Chinese-LLaMA-2-7B-hf", device_map="auto", torch_dtype=torch.float16, trust_remote_code=True)
+    print(model)
     print(torch.cuda.max_memory_allocated() / 1024 ** 3)
     lm_generation = LmGeneration(model, args.tokenizer)