Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -113,7 +113,7 @@ def loadAndSplitPdfFile(filePath):
|
|
113 |
img_metadata["image_index"] = img_index
|
114 |
documents.append(Document(page_content=ocr_text, metadata=img_metadata))
|
115 |
|
116 |
-
splitter = RecursiveCharacterTextSplitter(chunk_size=
|
117 |
final_chunks = splitter.split_documents(documents)
|
118 |
return final_chunks
|
119 |
|
|
|
113 |
img_metadata["image_index"] = img_index
|
114 |
documents.append(Document(page_content=ocr_text, metadata=img_metadata))
|
115 |
|
116 |
+
splitter = RecursiveCharacterTextSplitter(chunk_size=1500, chunk_overlap=500)
|
117 |
final_chunks = splitter.split_documents(documents)
|
118 |
return final_chunks
|
119 |
|