BuddyChrist / app.py
import streamlit as st
from ggulf import GGUFModel, GGUFTokenizer
import torch
model_name = "TheBloke/TinyLlama-1.1B-Chat-v0.3-GGUF"
# Load model and tokenizer
model = GGUFModel.from_pretrained(model_name)
tokenizer = GGUFTokenizer.from_pretrained(model_name)
# Set model to eval mode
model.eval()
st.title("Buddy Christ Chatbot")
user_input = st.text_input("You:", "")
if user_input:
    # Encode the user's message
    inputs = tokenizer.encode(user_input, return_tensors="pt")
    # Generate a response from the GGUF model
    response = model.generate(inputs,
                              max_length=1000,
                              temperature=1.0,
                              top_k=10,
                              pad_token_id=tokenizer.eos_token_id,
                              gguf_mode=True)
    # Decode the generated tokens before logging and displaying them
    response_text = tokenizer.decode(response[0])
    print(response_text)
    st.write("Buddy Christ:", response_text)
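# ----------------------------------------------------------------------------
# Hedged alternative sketch: the `ggulf` package imported above is not one I
# can verify, so this is a self-contained replacement for app.py that runs the
# same GGUF model on CPU with llama-cpp-python instead. Assumptions not taken
# from the original: the Q4_K_M quant filename, n_ctx=2048, n_threads=4, and
# using create_chat_completion to apply the model's chat template. Check the
# repo's file list and adjust before use; this replaces the code above rather
# than extending it.
# ----------------------------------------------------------------------------
import streamlit as st
from huggingface_hub import hf_hub_download
from llama_cpp import Llama

REPO_ID = "TheBloke/TinyLlama-1.1B-Chat-v0.3-GGUF"
FILENAME = "tinyllama-1.1b-chat-v0.3.Q4_K_M.gguf"  # assumed quant variant

@st.cache_resource
def load_model():
    # Download the GGUF file once and load it for CPU inference
    model_path = hf_hub_download(repo_id=REPO_ID, filename=FILENAME)
    return Llama(model_path=model_path, n_ctx=2048, n_threads=4)

llm = load_model()

st.title("Buddy Christ Chatbot")
user_input = st.text_input("You:", "")

if user_input:
    # llama-cpp-python formats the messages with the model's chat template
    result = llm.create_chat_completion(
        messages=[{"role": "user", "content": user_input}],
        max_tokens=256,
        temperature=1.0,
        top_k=10,
    )
    st.write("Buddy Christ:", result["choices"][0]["message"]["content"])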