DrishtiSharma committed on
Commit
2e95a3a
·
verified ·
1 Parent(s): c0f8ffc

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -6,7 +6,7 @@ from langchain.agents import AgentExecutor, create_openai_tools_agent
6
  from langchain_core.messages import BaseMessage, HumanMessage
7
  from langchain_community.tools.tavily_search import TavilySearchResults
8
  from langchain_experimental.tools import PythonREPLTool
9
- from langchain_community.document_loaders import DirectoryLoader, TextLoader
10
  from langchain.text_splitter import RecursiveCharacterTextSplitter
11
  from langchain_community.vectorstores import Chroma
12
  from langchain.embeddings import HuggingFaceBgeEmbeddings
@@ -15,6 +15,7 @@ from langchain_core.runnables import RunnablePassthrough
15
  from langchain.output_parsers.openai_functions import JsonOutputFunctionsParser
16
  from langchain_core.prompts import ChatPromptTemplate, MessagesPlaceholder
17
  from langgraph.graph import StateGraph, END
 
18
  from typing import Annotated, Sequence, TypedDict
19
  import functools
20
  import operator
@@ -73,7 +74,7 @@ if uploaded_files:
73
  docs = []
74
  for uploaded_file in uploaded_files:
75
  content = uploaded_file.read().decode("utf-8")
76
- docs.append(TextLoader(file_path=None, content=content).load()[0])
77
  text_splitter = RecursiveCharacterTextSplitter(chunk_size=100, chunk_overlap=10, length_function=len)
78
  new_docs = text_splitter.split_documents(documents=docs)
79
  embeddings = HuggingFaceBgeEmbeddings(model_name="BAAI/bge-base-en-v1.5", model_kwargs={'device': 'cpu'}, encode_kwargs={'normalize_embeddings': True})
 
6
  from langchain_core.messages import BaseMessage, HumanMessage
7
  from langchain_community.tools.tavily_search import TavilySearchResults
8
  from langchain_experimental.tools import PythonREPLTool
9
+ from langchain_community.document_loaders import DirectoryLoader
10
  from langchain.text_splitter import RecursiveCharacterTextSplitter
11
  from langchain_community.vectorstores import Chroma
12
  from langchain.embeddings import HuggingFaceBgeEmbeddings
 
15
  from langchain.output_parsers.openai_functions import JsonOutputFunctionsParser
16
  from langchain_core.prompts import ChatPromptTemplate, MessagesPlaceholder
17
  from langgraph.graph import StateGraph, END
18
+ from langchain_core.documents import Document
19
  from typing import Annotated, Sequence, TypedDict
20
  import functools
21
  import operator
 
74
  docs = []
75
  for uploaded_file in uploaded_files:
76
  content = uploaded_file.read().decode("utf-8")
77
+ docs.append(Document(page_content=content, metadata={"name": uploaded_file.name}))
78
  text_splitter = RecursiveCharacterTextSplitter(chunk_size=100, chunk_overlap=10, length_function=len)
79
  new_docs = text_splitter.split_documents(documents=docs)
80
  embeddings = HuggingFaceBgeEmbeddings(model_name="BAAI/bge-base-en-v1.5", model_kwargs={'device': 'cpu'}, encode_kwargs={'normalize_embeddings': True})