Spaces:

Ateeqq
/

Meta-Llama-3-8B-Instruct

Runtime error

hanzla committed on Apr 18, 2024

Commit

1b3204d

1 Parent(s): 5408877

reqs added

Files changed (1) hide show

app.py CHANGED Viewed

@@ -4,21 +4,26 @@ import torch
 import transformers
 import torch
-model_id = "meta-llama/Meta-Llama-3-8B"
-pipeline = transformers.pipeline(
-    "text-generation", model=model_id, model_kwargs={"torch_dtype": torch.bfloat16}, device_map="auto"
-)
 @spaces.GPU
 def yes_man(message, history):
-    return pipeline(message)
 gr.ChatInterface(
     yes_man,
     chatbot=gr.Chatbot(height=300),
-    textbox=gr.Textbox(placeholder="Ask me a yes or no question", container=False, scale=7),
-    title="Yes Man",
     description="Ask Yes Man any question",
     theme="soft",
     examples=["Hello", "Am I cool?", "Are tomatoes vegetables?"],

 import transformers
 import torch
+from transformers import AutoModelForCausalLM, AutoTokenizer
+model_name = "meta-llama/Meta-Llama-3-8B"
+tokenizer = AutoTokenizer.from_pretrained(model_name)
+model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype=torch.float16,device_map="auto")
 @spaces.GPU
 def yes_man(message, history):
+    input_ids = tokenizer(message, return_tensors="pt").input_ids.to(model.device)
+    output = model.generate(input_ids, max_length=512, num_return_sequences=1)
+    detailed_prompt = tokenizer.decode(output[0], skip_special_tokens=True)
+    return detailed_prompt
 gr.ChatInterface(
     yes_man,
     chatbot=gr.Chatbot(height=300),
+    textbox=gr.Textbox(placeholder="Enter message here", container=False, scale=7),
+    title="LLAMA 3 8B Chat",
     description="Ask Yes Man any question",
     theme="soft",
     examples=["Hello", "Am I cool?", "Are tomatoes vegetables?"],