Delete handler.py
Browse files- handler.py +0 -45
handler.py
DELETED
@@ -1,45 +0,0 @@
|
|
1 |
-
from typing import Any, Dict, List
|
2 |
-
|
3 |
-
import torch
|
4 |
-
import transformers
|
5 |
-
from transformers import AutoModelForCausalLM, AutoTokenizer
|
6 |
-
|
7 |
-
# Pick the inference dtype once at import time.
# bfloat16 needs hardware support (compute capability 8.x = Ampere and newer);
# use >= 8 so newer architectures (e.g. 9.x Hopper) also get bfloat16.
# Guard with is_available(): get_device_capability() raises on CPU-only hosts,
# which previously crashed the module at import.
if torch.cuda.is_available() and torch.cuda.get_device_capability()[0] >= 8:
    dtype = torch.bfloat16
else:
    dtype = torch.float16
|
8 |
-
|
9 |
-
class EndpointHandler:
    """Inference-endpoint handler wrapping a causal-LM text-generation pipeline.

    Loads the tokenizer and model once from ``path`` at start-up, configures
    near-deterministic generation settings, and serves scene-analysis requests
    through ``__call__``.
    """

    def __init__(self, path=""):
        """Load model/tokenizer from ``path`` and build the generation pipeline.

        Args:
            path: Local directory or hub identifier of the model repository.
        """
        # trust_remote_code is needed for checkpoints shipping custom model code.
        tokenizer = AutoTokenizer.from_pretrained(path, trust_remote_code=True)
        model = AutoModelForCausalLM.from_pretrained(
            path,
            return_dict=True,
            device_map="auto",  # shard/place layers across available devices
            load_in_8bit=False,
            torch_dtype=dtype,  # module-level dtype chosen from GPU capability
            trust_remote_code=True,
        )

        # Near-deterministic settings (temperature ~0) for structured JSON output;
        # pad/eos are pinned to the tokenizer's EOS to avoid warnings and ensure
        # clean termination.
        generation_config = model.generation_config
        generation_config.max_new_tokens = 10000
        generation_config.temperature = 0.01
        generation_config.num_return_sequences = 1
        generation_config.pad_token_id = tokenizer.eos_token_id
        generation_config.eos_token_id = tokenizer.eos_token_id
        self.generation_config = generation_config

        self.pipeline = transformers.pipeline(
            "text-generation", model=model, tokenizer=tokenizer
        )

    # FIX: annotation was ``Dist[str, Any]`` — an undefined name that raised
    # NameError at class-definition time (annotations are evaluated eagerly here).
    def __call__(self, data: Dict[str, Any]) -> Dict[str, Any]:
        """Analyze a narrative scene and return the pipeline's generation result.

        Args:
            data: Request payload. The prompt is read from ``data["inputs"]``;
                if the key is absent the whole payload object is used as the
                prompt (behavior of ``dict.pop`` with a default).

        Returns:
            The raw output of the text-generation pipeline for the chat
            messages (system instruction + user prompt).
        """
        prompt = data.pop("inputs", data)

        system_message = """
        You are an expert at analyzing the text of narrative scenes. Only respond with complete JSON responses beginning with [ and end with ]. Do not add new lines Separate the text of the scene to analyze into passages spoken aloud by a character from text not spoken aloud by a character. Identify the character speaking, and the tone being used. To help identify dialog, we have turned all quotation marks into the string SPOOOOOOKEN. For example the sentence SPOOOOOOKENHello, Janet,SPOOOOOOKEN John growled angrily. would result in the following output format: [{"position": 1, "type": "dialog", "narrator": "John", "tone": "angry", "content": "SPOOOOOOKENHello, Janet,SPOOOOOOKEN "}, {"position": 2, "type": "narration", "narrator": "Narrator", "tone": "", "content": "John growled angrily."}] If there is a new-line character, separate it as its own json object. Here is the scene to analyze:
        """.strip()

        messages = [
            {"role": "system", "content": system_message},
            {"role": "user", "content": prompt},
        ]
        result = self.pipeline(messages, generation_config=self.generation_config)
        return result
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|