Update app.py
app.py
CHANGED
```diff
@@ -12,12 +12,12 @@ from huggingface_hub import hf_hub_download
 hf_hub_download(
     repo_id="PartAI/Dorna-Llama3-8B-Instruct-GGUF",
     filename="dorna-llama3-8b-instruct.Q2_K.gguf",
-    local_dir = "
+    local_dir = "."
 )
 hf_hub_download(
     repo_id="PartAI/Dorna-Llama3-8B-Instruct-GGUF",
     filename="dorna-llama3-8b-instruct.Q4_0.gguf",
-    local_dir = "
+    local_dir = "."
 )
 
 css = """
@@ -57,7 +57,7 @@ def respond(
     chat_template = get_messages_formatter_type(model)
 
     llm = Llama(
-        model_path=f"
+        model_path=f"./{model}",
         flash_attn=True,
         n_threads=40,
         n_gpu_layers=81,
```
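The net effect of the change is that the quantized GGUF files are downloaded into the working directory (`local_dir="."`) and then loaded by relative path (`model_path=f"./{model}"`). Below is a minimal sketch of that pattern, assuming `llama-cpp-python` is installed alongside `huggingface_hub`; it is an illustration of the wiring in this commit, not the full app.

```python
# Minimal sketch: download a quantized GGUF file into the current directory,
# then load it by relative path (mirrors the local_dir="." and
# model_path=f"./{model}" changes in this commit).
from huggingface_hub import hf_hub_download
from llama_cpp import Llama

# Fetch the Q4_0 weights from the Hub into the working directory.
hf_hub_download(
    repo_id="PartAI/Dorna-Llama3-8B-Instruct-GGUF",
    filename="dorna-llama3-8b-instruct.Q4_0.gguf",
    local_dir=".",
)

# Load the model by relative path, as app.py now does.
model = "dorna-llama3-8b-instruct.Q4_0.gguf"
llm = Llama(
    model_path=f"./{model}",
    flash_attn=True,   # requires a llama-cpp-python build with flash attention support
    n_threads=40,      # CPU threads, as configured in the app
    n_gpu_layers=81,   # offload all layers to GPU when available
)
```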