Moha782 committed
Commit 76e0d03
1 Parent(s): 1dd768c

Update app.py

Files changed (1):
  app.py  +15 -1
app.py CHANGED
@@ -1,11 +1,22 @@
 import gradio as gr
 from huggingface_hub import InferenceClient
+from pathlib import Path
+from typing import List
+from pdfplumber import open as open_pdf
 
 """
 For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
 """
 client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
 
+# Load the PDF file (extract_text() may return None for pages without a text layer)
+pdf_path = Path("path/to/your/pdf/file.pdf")
+with open_pdf(pdf_path) as pdf:
+    text = "\n".join(page.extract_text() or "" for page in pdf.pages)
+
+# Split the PDF text into fixed-size chunks
+chunk_size = 1000  # Adjust this value based on your needs
+text_chunks: List[str] = [text[i:i + chunk_size] for i in range(0, len(text), chunk_size)]
 
 def respond(
     message,
@@ -27,12 +38,16 @@ def respond(
 
     response = ""
 
+    # chat_completion() has no files/context parameter, so prepend matching chunks to messages
+    relevant_chunks = [chunk for chunk in text_chunks if message.lower() in chunk.lower()]
+    if relevant_chunks:
+        messages.insert(0, {"role": "system", "content": "\n".join(relevant_chunks)})
     for message in client.chat_completion(
         messages,
         max_tokens=max_tokens,
         stream=True,
         temperature=temperature,
         top_p=top_p,
     ):
         token = message.choices[0].delta.content
 
@@ -58,6 +73,5 @@ demo = gr.ChatInterface(
     ],
 )
 
-
 if __name__ == "__main__":
     demo.launch()
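
The chunking and retrieval this commit adds can be exercised on its own, without a PDF or the Inference API. Below is a minimal sketch under stated assumptions: `sample_text` and `query` are made-up stand-ins for the extracted PDF text and the user's message, and the matching is the same naive case-insensitive substring test as in app.py, so a query that never appears verbatim in the document matches nothing.

# sketch: run the chunk/retrieve logic from app.py in isolation
from typing import List

# Hypothetical stand-in for the text pdfplumber would extract from the PDF
sample_text = "Zephyr is a 7B chat model fine-tuned from Mistral. " * 100

# Same fixed-size slicing as app.py
chunk_size = 1000
text_chunks: List[str] = [sample_text[i:i + chunk_size] for i in range(0, len(sample_text), chunk_size)]

# Same naive substring retrieval as app.py
query = "zephyr"
relevant_chunks = [chunk for chunk in text_chunks if query.lower() in chunk.lower()]

print(f"{len(text_chunks)} chunks total, {len(relevant_chunks)} matched {query!r}")

Note that fixed-size slicing can cut sentences in half at chunk boundaries, and matching the whole message as a substring is brittle for multi-word questions; overlapping windows and embedding-based similarity search are the usual refinements if retrieval quality matters.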