tfm-media-insights

Runtime error

File size: 1,664 Bytes

cb67dcf
4e5a5be
53f76b1
5ed2636
53f76b1
3ab6ca9
5ed2636
 
 
 
cb67dcf
3ab6ca9
d84d90d
374cee2
cb67dcf
5ed2636
 
 
 
 
53f76b1
 
 
 
 
85574d1
53f76b1
 
26bf4a5
85574d1
53f76b1
 
6dccfc2
ad2c8e4
cb67dcf
53f76b1
 
 
5b87039
 
 
 
53f76b1
 
5b87039
ad2c8e4
cb67dcf
 
e80f947
cb67dcf
 
 
eeb493a
2f1bde3
9d6a48d
cb67dcf
761feb6
cb67dcf

import gradio as gr
import torch
import transformers
# from transformers import AutoTokenizer
from langchain import LLMChain, HuggingFacePipeline, PromptTemplate
import os
from ctransformers import AutoModelForCausalLM, AutoTokenizer

# Hugging Face access token, taken from the "Llama2" environment variable.
# It is None when the variable is not set.
access_token = os.environ.get("Llama2")

# GGML build of GPT-2 loaded through ctransformers. hf=True requests the
# transformers-compatible wrapper so the model can be handed to a
# transformers pipeline (per the ctransformers README — confirm on upgrade).
model = AutoModelForCausalLM.from_pretrained(
    "marella/gpt-2-ggml",
    hf=True,
)
# The ctransformers tokenizer is derived from the loaded model object,
# not from a repository id.
tokenizer = AutoTokenizer.from_pretrained(model)

# Summarization chain shared by every request. It is created on the first
# call to greet() because building the generation pipeline is expensive and
# nothing in it depends on the request.
_summary_chain = None


def _build_summary_chain():
    """Build the LangChain summarization chain around the text-generation pipeline.

    Uses the module-level ``model`` and ``tokenizer`` rather than loading a
    second copy of the weights.

    Returns:
        An ``LLMChain`` whose prompt has a single ``text`` input variable.
    """
    # NOTE: to try Llama 2 instead, load "meta-llama/Llama-2-7b-hf" with the
    # transformers AutoTokenizer and pass token=access_token.
    text_generator = transformers.pipeline(
        "text-generation",
        model=model,
        tokenizer=tokenizer,
        torch_dtype=torch.bfloat16,
        trust_remote_code=True,
        device_map="auto",
        max_length=512,
        # Greedy decoding. NOTE(review): top_k is a sampling option and is
        # presumably ignored while do_sample=False — confirm before relying on it.
        do_sample=False,
        top_k=10,
        num_return_sequences=1,
        eos_token_id=tokenizer.eos_token_id,
        token=access_token,
    )

    llm = HuggingFacePipeline(
        pipeline=text_generator,
        model_kwargs={'temperature': 0},
    )

    template = """Write a concise summary of the following:
                "{text}"
                CONCISE SUMMARY:"""

    prompt = PromptTemplate(template=template, input_variables=["text"])
    return LLMChain(prompt=prompt, llm=llm)


def greet(text):
    """Return a concise summary of ``text`` produced by the language model.

    Args:
        text: The passage to summarize, as entered in the UI text box.

    Returns:
        The chain's output string, or ``""`` when ``text`` is empty, ``None``
        or only whitespace (there is nothing to summarize, so the model is
        not invoked).
    """
    global _summary_chain

    # Guard clause: skip model work for blank submissions.
    if not text or not text.strip():
        return ""

    # Build the chain once and reuse it; previously the model, tokenizer and
    # pipeline were re-created on every button click.
    if _summary_chain is None:
        _summary_chain = _build_summary_chain()

    return _summary_chain.run(text)

# Single-page UI: one input box, one output box, a submit button and a
# clear button that resets both boxes.
with gr.Blocks() as demo:
    input_box = gr.Textbox(label="Text")
    summary_box = gr.Textbox(label="Summary")

    submit_button = gr.Button(value="Submit")
    clear_button = gr.ClearButton(components=[input_box, summary_box])

    # Clicking "Submit" sends the input text to greet() and shows the result
    # in the summary box; the handler is also exposed under the API name "greet".
    submit_button.click(
        fn=greet,
        inputs=input_box,
        outputs=summary_box,
        api_name="greet",
    )

# Start the Gradio server.
demo.launch()