Spaces:

Alessio2405
/

HostMixCPU

Sleeping

Alessio2405 committed on Mar 1, 2024

Commit

8adc0ac

verified ·

1 Parent(s): 11abc6c

Upload 5 files

Files changed (6) hide show

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+mistral-7b-openorca.Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text

Dockerfile ADDED Viewed

+# Image for serving main.py (FastAPI app) with uvicorn.
+FROM python:3.9
+WORKDIR /code
+# Install Python dependencies before copying the application files.
+COPY ./requirements.txt /code/requirements.txt
+RUN pip install --no-cache-dir --upgrade -r /code/requirements.txt
+# The model file is named with a .gguf extension in the repository and main.py
+# loads it by that exact name, so source and destination must both include it.
+COPY ./mistral-7b-openorca.Q4_K_S.gguf /code/mistral-7b-openorca.Q4_K_S.gguf
+COPY ./main.py /code/main.py
+# Start the ASGI server for the `app` object in main.py on port 7860.
+CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860"]

README.md CHANGED Viewed

@@ -1,10 +1,11 @@
 ---
-title: HostMixCPU
-emoji: 🐨
-colorFrom: yellow
 colorTo: pink
 sdk: docker
 pinned: false
 ---
 Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

 ---
+title: LLM Deployment Zerocost Api
+emoji: 😻
+colorFrom: purple
 colorTo: pink
 sdk: docker
 pinned: false
+license: mit
 ---
 Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

main.py ADDED Viewed

+from ctransformers import AutoModelForCausalLM
+from fastapi import FastAPI, Form
+from pydantic import BaseModel
+#Model loading
+llm = AutoModelForCausalLM.from_pretrained("mistral-7b-openorca.Q4_K_S.gguf",
+model_type='mistral',
+max_new_tokens = 1096,
+threads = 3,
+)
+# Request body model for the /llm_on_cpu endpoint: a single string field,
+# `prompt`, holding the user's text.
+class validation(BaseModel):
+    prompt: str
+# FastAPI application instance; routes below are registered on it.
+app = FastAPI()
+#Zephyr completion
+@app.post("/llm_on_cpu")
+async def stream(item: validation):
+    system_prompt = 'Below is an instruction that describes a task. Write a response that appropriately completes the request. Write only in ITALIAN.'
+    E_INST = "</s>"
+    user, assistant = "<|user|>", "<|assistant|>"
+    prompt = f"{system_prompt}{E_INST}\n{user}\n{item.prompt.strip()}{E_INST}\n{assistant}\n"
+    return llm(prompt)

mistral-7b-openorca.Q4_K_S.gguf ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:3e72b3262c11ba4104cd31931d53b2b42723114f2063afd408b6f9d4da06515b
+size 4140385024

requirements.txt ADDED Viewed

+python-multipart
+fastapi
+pydantic
+uvicorn
+requests
+ctransformers