Spaces:

xuqinyang
/

Baichuan-13B-Chat

Runtime error

xuqinyang committed on Jul 22, 2023

Commit

dbc3c4a

1 Parent(s): ea0d3c0

Update model.py

Files changed (1) hide show

model.py CHANGED Viewed

@@ -9,7 +9,7 @@ from huggingface_hub import snapshot_download
 snapshot_download(model_id, local_dir="./")
 from llama_cpp import Llama
-self.llm = Llama(model_path="./ggml-model-q4_0.bin", n_ctx=4096,seed=-1,n_threads=4)
 def run(message: str,
         chat_history: list[tuple[str, str]],
@@ -22,6 +22,6 @@ def run(message: str,
     for i in chat_history:
         history.append({"role": "user", "content": i[0]})
         history.append({"role": "assistant", "content": i[1]})
-    for response in self.llm.create_chat_completion(messages,stream=True,max_tokens=-1,temperature=0.3,top_k=5,top_p=0.85,repeat_penalty=1.1):
         if "content" in response["choices"][0]["delta"]:
             yield response["choices"][0]["delta"]["content"]

 snapshot_download(model_id, local_dir="./")
 from llama_cpp import Llama
+llm = Llama(model_path="./ggml-model-q4_0.bin", n_ctx=4096,seed=-1,n_threads=4)
 def run(message: str,
         chat_history: list[tuple[str, str]],
     for i in chat_history:
         history.append({"role": "user", "content": i[0]})
         history.append({"role": "assistant", "content": i[1]})
+    for response in llm.create_chat_completion(messages,stream=True,max_tokens=-1,temperature=0.3,top_k=5,top_p=0.85,repeat_penalty=1.1):
         if "content" in response["choices"][0]["delta"]:
             yield response["choices"][0]["delta"]["content"]