Demo1
Browse files- app.py +33 -0
- requirements.txt +3 -0
app.py
ADDED
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
from llama_cpp import Llama
from huggingface_hub import hf_hub_download
from flask import Flask, request, jsonify

# Flask app exposing a minimal text-completion API around a local GGUF model.
app = Flask(__name__)

# Fetch the quantized Phi-2 weights into the working directory at startup.
# NOTE(review): this runs on every import; hf_hub_download re-uses an existing
# local copy rather than re-downloading — confirm for the local_dir code path.
hf_hub_download("TheBloke/phi-2-GGUF", "phi-2.Q8_0.gguf", local_dir="./")
# n_ctx=2048 matches Phi-2's context window; n_gpu_layers=999 requests that
# all layers be offloaded to GPU when a GPU build of llama.cpp is available.
phi = Llama(model_path="./phi-2.Q8_0.gguf", n_ctx=2048, n_gpu_layers=999)
|
9 |
+
|
10 |
+
# BUG FIX: the original read `app.route("/", methods=["GET"])` on its own
# line — calling route() without applying it as a decorator — so the "/"
# route was never registered and index() was unreachable dead code.
@app.route("/", methods=["GET"])
def index():
    """Landing page directing callers to the POST /completion endpoint."""
    return "<html><body><h1>Use API</h1><p>Use /completion as POST with a prompt in a JSON query.</p></body></html>"
|
13 |
+
|
14 |
+
@app.route("/completion", methods=["POST"])
def completion():
    """Generate two completions for the prompt in the POSTed JSON body.

    Expects a JSON body of the form {"prompt": "..."}.
    Returns JSON {"responses": [text_1, text_2]} on success, or a 400
    error object when the body is missing or has no "prompt" field.
    """
    # Robustness: request.json raises (→ HTTP 500) on a missing/invalid
    # JSON body; validate explicitly and answer with a clear 400 instead.
    payload = request.get_json(silent=True)
    if not payload or "prompt" not in payload:
        return jsonify({"error": "POST a JSON body with a 'prompt' field"}), 400
    prompt = payload["prompt"]

    # BUG FIX: llama-cpp-python's Llama.__call__/create_completion does not
    # accept a `num_completions` argument (the original call raised
    # TypeError), and a single call returns only one choice, so indexing
    # res["choices"][1] could never succeed. Sample twice to produce the
    # two responses the endpoint promises.
    responses = []
    for _ in range(2):
        res = phi(
            prompt,
            temperature=0.33,
            top_p=0.95,
            top_k=42,
            max_tokens=1024,
        )
        responses.append(res["choices"][0]["text"])

    return jsonify({"responses": responses})
|
31 |
+
|
32 |
+
# Run the Flask development server on all interfaces; port 7860 is the
# conventional port for Hugging Face Spaces apps.
if __name__ == "__main__":
    app.run(host="0.0.0.0", port=7860)
|
requirements.txt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
llama-cpp-python
|
2 |
+
huggingface-hub
|
3 |
+
flask
|