Shreyas094 committed on
Commit
12fb7a6
·
verified ·
1 Parent(s): 0c47c77

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -1
app.py CHANGED
@@ -103,6 +103,8 @@ def update_vectors(files, parser):
103
 
104
  data = load_document(file_path, parser)
105
  logging.info(f"Loaded {len(data)} chunks from {file.name}")
 
 
106
  all_data.extend(data)
107
  total_chunks += len(data)
108
  # Append new documents instead of replacing
@@ -458,8 +460,12 @@ def get_response_from_pdf(query, model, selected_docs, num_calls=3, temperature=
458
  relevant_docs = retriever.get_relevant_documents(query)
459
  logging.info(f"Number of relevant documents retrieved: {len(relevant_docs)}")
460
 
 
 
 
 
461
  # Filter relevant_docs based on selected documents
462
- filtered_docs = [doc for doc in relevant_docs if doc.metadata["source"] in selected_docs]
463
  logging.info(f"Number of filtered documents: {len(filtered_docs)}")
464
 
465
  if not filtered_docs:
 
103
 
104
  data = load_document(file_path, parser)
105
  logging.info(f"Loaded {len(data)} chunks from {file.name}")
106
+ for chunk in data:
107
+ logging.info(f"Chunk content preview: {chunk.page_content[:100]}...") # Log first 100 characters of each chunk
108
  all_data.extend(data)
109
  total_chunks += len(data)
110
  # Append new documents instead of replacing
 
460
  relevant_docs = retriever.get_relevant_documents(query)
461
  logging.info(f"Number of relevant documents retrieved: {len(relevant_docs)}")
462
 
463
+ # Log the sources of all retrieved documents
464
+ for doc in relevant_docs:
465
+ logging.info(f"Retrieved document source: {doc.metadata['source']}")
466
+
467
  # Filter relevant_docs based on selected documents
468
+ filtered_docs = [doc for doc in relevant_docs if os.path.basename(doc.metadata["source"]) in selected_docs]
469
  logging.info(f"Number of filtered documents: {len(filtered_docs)}")
470
 
471
  if not filtered_docs: