Spaces:
Paused
Paused
Shreyas094
committed on
Update app.py
Browse files
app.py
CHANGED
@@ -103,6 +103,8 @@ def update_vectors(files, parser):
|
|
103 |
|
104 |
data = load_document(file_path, parser)
|
105 |
logging.info(f"Loaded {len(data)} chunks from {file.name}")
|
|
|
|
|
106 |
all_data.extend(data)
|
107 |
total_chunks += len(data)
|
108 |
# Append new documents instead of replacing
|
@@ -458,8 +460,12 @@ def get_response_from_pdf(query, model, selected_docs, num_calls=3, temperature=
|
|
458 |
relevant_docs = retriever.get_relevant_documents(query)
|
459 |
logging.info(f"Number of relevant documents retrieved: {len(relevant_docs)}")
|
460 |
|
|
|
|
|
|
|
|
|
461 |
# Filter relevant_docs based on selected documents
|
462 |
-
filtered_docs = [doc for doc in relevant_docs if doc.metadata["source"] in selected_docs]
|
463 |
logging.info(f"Number of filtered documents: {len(filtered_docs)}")
|
464 |
|
465 |
if not filtered_docs:
|
|
|
103 |
|
104 |
data = load_document(file_path, parser)
|
105 |
logging.info(f"Loaded {len(data)} chunks from {file.name}")
|
106 |
+
for chunk in data:
|
107 |
+
logging.info(f"Chunk content preview: {chunk.page_content[:100]}...") # Log first 100 characters of each chunk
|
108 |
all_data.extend(data)
|
109 |
total_chunks += len(data)
|
110 |
# Append new documents instead of replacing
|
|
|
460 |
relevant_docs = retriever.get_relevant_documents(query)
|
461 |
logging.info(f"Number of relevant documents retrieved: {len(relevant_docs)}")
|
462 |
|
463 |
+
# Log the sources of all retrieved documents
|
464 |
+
for doc in relevant_docs:
|
465 |
+
logging.info(f"Retrieved document source: {doc.metadata['source']}")
|
466 |
+
|
467 |
# Filter relevant_docs based on selected documents
|
468 |
+
filtered_docs = [doc for doc in relevant_docs if os.path.basename(doc.metadata["source"]) in selected_docs]
|
469 |
logging.info(f"Number of filtered documents: {len(filtered_docs)}")
|
470 |
|
471 |
if not filtered_docs:
|