whatsthispdf04

Running

mitulagr2 committed on Jul 11, 2024

Commit

ce047d8

1 Parent(s): 889a629

Update rag.py

Files changed (1) hide show

app/rag.py CHANGED Viewed

@@ -26,7 +26,7 @@ class ChatPDF:
     pdf_count = 0
     def __init__(self):
-        self.text_parser = SentenceSplitter(chunk_size=128, chunk_overlap=8)
         logger.info("initializing the vector store related objects")
         # client = QdrantClient(host="localhost", port=6333)
@@ -45,9 +45,9 @@ class ChatPDF:
         llm = LlamaCPP(
             model_url="https://huggingface.co/Qwen/Qwen2-0.5B-Instruct-GGUF/resolve/main/qwen2-0_5b-instruct-fp16.gguf",
             temperature=0.1,
-            max_new_tokens=256,
             # context_window=3900, #32k
-            generate_kwargs={"max_tokens": 256, "temperature": 0.1, "top_k": 12},
             # model_kwargs={"n_gpu_layers": -1},
             # messages_to_prompt=self.messages_to_prompt,
             # completion_to_prompt=self.completion_to_prompt,
@@ -103,7 +103,7 @@ class ChatPDF:
         self.query_engine = index.as_query_engine(
             streaming=True,
-            similarity_top_k=12,
         )
     def ask(self, query: str):

     pdf_count = 0
     def __init__(self):
+        self.text_parser = SentenceSplitter(chunk_size=1024, chunk_overlap=24)
         logger.info("initializing the vector store related objects")
         # client = QdrantClient(host="localhost", port=6333)
         llm = LlamaCPP(
             model_url="https://huggingface.co/Qwen/Qwen2-0.5B-Instruct-GGUF/resolve/main/qwen2-0_5b-instruct-fp16.gguf",
             temperature=0.1,
+            max_new_tokens=128,
             # context_window=3900, #32k
+            generate_kwargs={"max_tokens": 128, "temperature": 0.1, "top_k": 3},
             # model_kwargs={"n_gpu_layers": -1},
             # messages_to_prompt=self.messages_to_prompt,
             # completion_to_prompt=self.completion_to_prompt,
         self.query_engine = index.as_query_engine(
             streaming=True,
+            similarity_top_k=3,
         )
     def ask(self, query: str):