Deepakvictor
committed on
Commit • 3da6512
1 Parent(s): 32681ab
Create handler.py
Browse files
- handler.py +17 -0
handler.py ADDED
@@ -0,0 +1,17 @@
+from typing import Dict, List, Any
+from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
+import torch
+device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+class EndpointHandler:
+    def __init__(self, path=""):
+        self.tokenizer = AutoTokenizer.from_pretrained(path)
+        self.model = AutoModelForSeq2SeqLM.from_pretrained(path).to(device)
+
+    def __call__(self, data: str) -> Dict[str, Any]:
+        inp = self.tokenizer(data, return_tensors="pt")
+        for q in inp:
+            inp[q] = inp[q].to(device)
+        with torch.inference_mode():
+            out = self.model.generate(**inp)
+        final_output = self.tokenizer.batch_decode(out, skip_special_tokens=True)
+        return {"translation": final_output[0]}
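For a quick local sanity check of this handler, a minimal sketch might look like the following. The path "." and the input sentence are placeholder assumptions, and it presumes a seq2seq translation model and tokenizer are available at that path (this usage is not part of the commit itself).

# Minimal local smoke test (sketch): assumes handler.py sits next to this script
# and that "." points at a directory containing seq2seq model weights and a tokenizer.
from handler import EndpointHandler

handler = EndpointHandler(path=".")      # loads tokenizer and model once
result = handler("Hello, how are you?")  # runs a single translation request
print(result)                            # e.g. {"translation": "..."}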