|
import gradio as gr |
|
from openai import OpenAI |
|
import os |
|
import numpy as np |
|
from src.document_processing.processor import DocumentProcessor |
|
from src.rag.retriever import Retriever |
|
from src.rag.generator import Generator |
|
from src.api.openai_api import OpenAIAPI |
|
|
|
|
|
# Read the OpenAI key from the environment; an unset variable yields "".
api_key = os.getenv("OPENAI_API_KEY", "")

# One API wrapper instance is shared by every RAG component below.
openai_api = OpenAIAPI(api_key=api_key)

# RAG pipeline pieces: ingestion, retrieval, and answer generation.
document_processor = DocumentProcessor(api_client=openai_api)
retriever = Retriever(api_client=openai_api)
generator = Generator(api_client=openai_api)
|
|
|
def respond(
    message,
    history: list[tuple[str, str]],
    system_message,
    max_tokens,
    temperature,
    top_p,
):
    """Stream a chat reply, answering from uploaded documents when asked.

    When the message contains "bruk dokumenter" or "bruk rag"
    (case-insensitive), the reply is produced by the module-level
    ``retriever`` and ``generator`` and yielded once. If that path raises,
    the failure is printed and the request falls back to a streamed GPT-4o
    chat completion.

    Args:
        message: The latest user message.
        history: Earlier turns as (user, assistant) pairs; empty entries of a
            pair are skipped.
        system_message: Content of the system prompt.
        max_tokens: Token limit passed to the chat completion (not used by
            the RAG path).
        temperature: Sampling temperature, passed to both paths.
        top_p: Nucleus-sampling value passed to the chat completion (not used
            by the RAG path).

    Yields:
        The RAG answer once, or the accumulated response text after every
        streamed chunk that carries content.
    """
    lowered = message.lower()
    use_rag = "bruk dokumenter" in lowered or "bruk rag" in lowered

    if use_rag:
        try:
            retrieved_chunks = retriever.retrieve(message)
            rag_answer = generator.generate(
                query=message,
                retrieved_chunks=retrieved_chunks,
                temperature=temperature,
            )
        except Exception as e:
            # Deliberate best-effort: any RAG failure degrades to the plain
            # chat completion below instead of failing the whole request.
            print(f"RAG failed: {str(e)}, falling back to standard GPT-4o")
        else:
            yield rag_answer
            return

    client = OpenAI(api_key=api_key)

    # Rebuild the conversation in the role/content format the API expects.
    messages = [{"role": "system", "content": system_message}]
    for user_text, assistant_text in history:
        if user_text:
            messages.append({"role": "user", "content": user_text})
        if assistant_text:
            messages.append({"role": "assistant", "content": assistant_text})
    messages.append({"role": "user", "content": message})

    response = ""
    stream = client.chat.completions.create(
        model="gpt-4o",
        messages=messages,
        max_tokens=max_tokens,
        stream=True,
        temperature=temperature,
        top_p=top_p,
    )
    for chunk in stream:
        # A streamed chunk may carry an empty `choices` list; indexing [0]
        # on it would raise IndexError, so skip such chunks.
        if not chunk.choices:
            continue
        content = chunk.choices[0].delta.content
        if content:
            response += content
            yield response
|
|
|
|
|
""" |
|
For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface |
|
""" |
|
# Chat tab. The additional inputs are listed in the same order as the extra
# parameters of `respond`: system message, max tokens, temperature, top-p.
demo = gr.ChatInterface(
    respond,
    additional_inputs=[
        gr.Textbox(
            value="Du er en hjelpsom assistent som svarer på norsk. Bruk kunnskapen din til å svare på spørsmål. Hvis brukeren skriver 'bruk dokumenter' eller 'bruk RAG', vil du bruke Retrieval-Augmented Generation for å svare basert på opplastede dokumenter.",
            label="System message",
        ),
        gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
        # The OpenAI chat completions API only accepts temperatures up to 2;
        # the slider is capped there so it cannot produce a rejected request.
        gr.Slider(minimum=0.1, maximum=2.0, value=0.7, step=0.1, label="Temperature"),
        gr.Slider(
            minimum=0.1,
            maximum=1.0,
            value=0.95,
            step=0.05,
            label="Top-p (nucleus sampling)",
        ),
    ],
    title="Norwegian RAG Chatbot with GPT-4o",
    description="En chatbot basert på Retrieval-Augmented Generation (RAG) for norsk språk med GPT-4o. Skriv 'bruk dokumenter' eller 'bruk RAG' i meldingen din for å aktivere RAG-funksjonalitet.",
)
|
|
|
|
|
def _document_rows():
    """Return one table row per document known to `document_processor`.

    Each row is [document id, filename, processed date, chunk count]; missing
    metadata falls back to "N/A" (or 0 for the chunk count).
    """
    return [
        [
            doc_id,
            meta.get("filename", "N/A"),
            meta.get("processed_date", "N/A"),
            meta.get("chunk_count", 0),
        ]
        for doc_id, meta in document_processor.get_all_documents().items()
    ]


# Document tab: upload files for RAG and list what has been processed.
# NOTE(review): the nesting below was reconstructed; confirm that the status
# box and refresh button belong under the row rather than inside a column.
with gr.Blocks() as document_upload:
    with gr.Tab("Last opp dokumenter"):
        with gr.Row():
            with gr.Column(scale=2):
                file_output = gr.File(label="Opplastede dokumenter")
                upload_button = gr.UploadButton(
                    "Klikk for å laste opp dokument",
                    # Gradio expects file extensions with a leading dot;
                    # bare names such as "pdf" are not treated as extensions.
                    file_types=[".pdf", ".txt", ".html"],
                    file_count="multiple",
                )

            with gr.Column(scale=3):
                documents_list = gr.Dataframe(
                    headers=["Dokument ID", "Filnavn", "Dato", "Chunks"],
                    label="Dokumentliste",
                    interactive=False,
                )

        process_status = gr.Textbox(label="Status", interactive=False)
        refresh_btn = gr.Button("Oppdater dokumentliste")

    # Event wiring stays inside the Blocks context so the listeners attach
    # to this app.
    # NOTE(review): the handler's two outputs go to the status box and the
    # document table; with file_count="multiple" it presumably receives a
    # list of files - confirm against DocumentProcessor.process_document.
    upload_button.upload(
        fn=document_processor.process_document,
        inputs=[upload_button],
        outputs=[process_status, documents_list],
    )

    refresh_btn.click(
        fn=_document_rows,
        inputs=None,
        outputs=[documents_list],
    )
|
|
|
|
|
# Combine the chat UI and the document manager into one two-tab application.
app = gr.TabbedInterface(
    interface_list=[demo, document_upload],
    tab_names=["Chat", "Dokumenter"],
)


# Start the server only when this file is executed as a script.
if __name__ == "__main__":
    app.launch()
|
|