aliMohammad16 committed on
Commit
49332a9
·
verified ·
1 Parent(s): b2c1dd8

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +20 -0
app.py ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from fastapi import FastAPI
2
+ from transformers import AutoModelForCausalLM, AutoTokenizer
3
+ import torch
4
+
5
# Application object that the route decorators in this file register against.
app = FastAPI()

# Hugging Face Hub repository id used for both the tokenizer and the weights.
# NOTE(review): confirm this id resolves on the Hub -- the published DeepSeek
# LLM 7B checkpoints appear to carry a "-base" / "-chat" suffix.
MODEL_NAME = "deepseek-ai/deepseek-llm-7b"

# Both objects are built once, at import time, and reused by the handlers.
tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
model = AutoModelForCausalLM.from_pretrained(
    MODEL_NAME,
    torch_dtype=torch.float16,  # load the weights in half precision
    device_map="auto",  # let the loader decide device placement
)
10
+
11
# Health-check route: answers GET / with a fixed status payload.
# Documented with comments rather than a docstring because FastAPI copies a
# handler's docstring into the generated OpenAPI description.
@app.get("/")
def root():
    status_payload = {"message": "DeepSeek API is running!"}
    return status_payload
14
+
15
@app.post("/summarize/")
async def summarize(input_text: str):
    """Generate up to 100 new tokens from ``input_text`` and return them.

    Args:
        input_text: Text passed to the tokenizer as the prompt.

    Returns:
        A dict with a single key, ``"summary"``, holding the decoded
        generated text. The prompt itself is not repeated in the value.
    """
    # Move the tensors to the device the model actually lives on. The model
    # is loaded with device_map="auto", so a hard-coded "cuda" breaks on
    # hosts without a GPU and can mismatch the model's real placement.
    encoded = tokenizer(input_text, return_tensors="pt").to(model.device)

    # NOTE(review): generate() blocks, and this is an async handler, so the
    # event loop serves no other request until generation finishes.
    generated = model.generate(**encoded, max_new_tokens=100)

    # For a causal LM the returned sequence starts with the prompt tokens;
    # drop them so only the newly generated text is decoded.
    prompt_length = encoded["input_ids"].shape[-1]
    completion_ids = generated[0][prompt_length:]
    summary = tokenizer.decode(completion_ids, skip_special_tokens=True)
    return {"summary": summary}