Spaces:
Runtime error
Runtime error
yosuke123456
committed on
Commit
•
8fc89a7
1
Parent(s):
3ec0b48
Add application file
Browse files- .gitattributes +4 -0
- ALV2_ALV3DTUζδ½γγγ₯γ’γ«DTU-V3SET01.pdf +3 -0
- ALV3PCγ΅γΌγ_γ½γγγ¦γ§γ’ζδ½γγγ₯γ’γ«_η»εγγ‘γ€γ«εδ».pdf +3 -0
- app.py +98 -0
- requirements.txt +0 -0
- ηΎεγγγ―η·εγ«γΏγγ°η¬¬31η_εε.pdf +3 -0
- ηΎεγγγ―η·εγ«γΏγγ°η¬¬31η_εΎε.pdf +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
ALV2_ALV3DTUζδ½γγγ₯γ’γ«DTU-V3SET01.pdf filter=lfs diff=lfs merge=lfs -text
|
37 |
+
ALV3PCγ΅γΌγ_γ½γγγ¦γ§γ’ζδ½γγγ₯γ’γ«_η»εγγ‘γ€γ«εδ».pdf filter=lfs diff=lfs merge=lfs -text
|
38 |
+
ηΎεγγγ―η·εγ«γΏγγ°η¬¬31η_εΎε.pdf filter=lfs diff=lfs merge=lfs -text
|
39 |
+
ηΎεγγγ―η·εγ«γΏγγ°η¬¬31η_εε.pdf filter=lfs diff=lfs merge=lfs -text
|
ALV2_ALV3DTUζδ½γγγ₯γ’γ«DTU-V3SET01.pdf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04320ba9416cd11d758c80ec22663f3d7f06270aa034cde26a978af2563e7879
|
3 |
+
size 5539267
|
ALV3PCγ΅γΌγ_γ½γγγ¦γ§γ’ζδ½γγγ₯γ’γ«_η»εγγ‘γ€γ«εδ».pdf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de1312a63aa1ab60a6353694bfb8d87d709a71e7ebd77e06f1292ec03c497497
|
3 |
+
size 30541345
|
app.py
ADDED
@@ -0,0 +1,98 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# https://qiita.com/nekoniii3/items/5acf764af65212d9f04f
|
2 |
+
|
3 |
+
import gradio as gr
|
4 |
+
import random
|
5 |
+
import time
|
6 |
+
|
7 |
+
import os
|
8 |
+
|
9 |
+
from langchain_community.document_loaders import PyMuPDFLoader
|
10 |
+
from langchain.text_splitter import RecursiveCharacterTextSplitter
|
11 |
+
# from langchain_community.chat_models import ChatOpenAI
|
12 |
+
from langchain_openai import ChatOpenAI
|
13 |
+
from langchain_community.vectorstores import Chroma
|
14 |
+
from langchain.chains import RetrievalQA
|
15 |
+
from langchain_community.embeddings import OpenAIEmbeddings
|
16 |
+
|
17 |
+
|
18 |
+
|
19 |
+
# Turn off parallelism in the Hugging Face `tokenizers` library.
os.environ["TOKENIZERS_PARALLELISM"] = "false"

# SECURITY: the OpenAI API key must come from the process environment
# (for example a Space secret), never from source control. A key was
# previously hard-coded on this line; it remains in the repository history
# and should be revoked.
if not os.environ.get("OPENAI_API_KEY"):
    import warnings

    warnings.warn(
        "OPENAI_API_KEY is not set; OpenAI embedding and chat calls will fail.",
        RuntimeWarning,
    )
|
21 |
+
|
22 |
+
# PDF documents that are indexed for retrieval, in indexing order.
PDF_FILE_NAMES = [
    'ALV2_ALV3DTUζδ½γγγ₯γ’γ«DTU-V3SET01.pdf',
    'ALV3PCγ΅γΌγ_γ½γγγ¦γ§γ’ζδ½γγγ₯γ’γ«_η»εγγ‘γ€γ«εδ».pdf',
    'ηΎεγγγ―η·εγ«γΏγγ°η¬¬31η_εε.pdf',
    'ηΎεγγγ―η·εγ«γΏγγ°η¬¬31η_εΎε.pdf',
]

# Splits loaded documents into chunks of up to 1000 characters, no overlap.
text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=0)

# Load every PDF and collect its chunks into one list, preserving file order.
texts = []
for pdf_file_name in PDF_FILE_NAMES:
    pdf_documents = PyMuPDFLoader(pdf_file_name).load()
    texts.extend(text_splitter.split_documents(pdf_documents))

# Embed all chunks and store them in a Chroma vector store.
embeddings = OpenAIEmbeddings(model="text-embedding-ada-002")
vectordb = Chroma.from_documents(texts, embeddings)
llm = ChatOpenAI(model_name="gpt-3.5-turbo-16k", temperature=0.05)

# Retrieval QA chain; source documents are returned alongside the answer so
# the caller can report which PDF and page each answer came from.
qa = RetrievalQA.from_chain_type(
    llm=llm,
    chain_type="stuff",
    retriever=vectordb.as_retriever(),
    return_source_documents=True,
)
|
54 |
+
|
55 |
+
import shutil
|
56 |
+
def save_image_filepath(filepath: str):
    """Copy an image file into the working directory as ``filepath<ext>``.

    Args:
        filepath: Path of the source image. ``None`` or an empty string is
            treated as "nothing to save" and ignored (presumably what an
            empty image widget passes; verify against the caller).

    Returns:
        None.
    """
    if not filepath:
        # Nothing to copy; avoid the TypeError/FileNotFoundError that
        # os.path.splitext / shutil.copy would raise on None or "".
        return None

    print(filepath)
    # Save the image, keeping the source file's extension.
    _, file_extension = os.path.splitext(filepath)
    shutil.copy(filepath, './filepath{}'.format(file_extension))
    return None
|
62 |
+
|
63 |
+
with gr.Blocks() as demo:
    # Chat transcript; entries are appended as [user_message, reply] pairs.
    chatbot = gr.Chatbot()

    # Disabled image-upload UI, kept for reference:
    # with gr.Row():
    #     with gr.Column():
    #         image_input_filepath = gr.Image(type='filepath')
    #         image_button_filepath = gr.Button("filepath")
    #
    #     image_button_filepath.click(save_image_filepath, inputs=image_input_filepath)

    msg = gr.Textbox()

    def user(user_message, history):
        """Answer a submitted question and append the exchange to the chat.

        Args:
            user_message: Text submitted from the textbox.
            history: Current chat history as a list of [message, reply] pairs.

        Returns:
            A tuple ``("", new_history)``: the empty string clears the
            textbox, and ``new_history`` is the updated chat history.
        """
        # Ignore blank submissions instead of sending an empty query to the
        # retrieval chain.
        if not user_message or not user_message.strip():
            return "", history

        answer = qa.invoke({"query": user_message})
        reply = answer['result']

        # Log which PDF and page each retrieved chunk came from.
        for sd in answer["source_documents"]:
            source = str(sd.metadata["source"])
            # Page metadata appears to be zero-based, hence the +1 (confirm).
            page = str(sd.metadata["page"] + 1).zfill(3)
            print("PDFοΌ" + source)
            print("γγΌγΈοΌ" + page)

        # NOTE(review): the same fixed link is appended to every answer,
        # regardless of the retrieved sources; confirm this is intended.
        reply = reply + '<a href="https://dcs.mediapress-net.com/iportal/cv.do?c=20958580000&pg=108&v=MIW10001&d=LINK_MIW">link</a>'

        return "", (history or []) + [[user_message, reply]]

    def bot(history):
        """Yield the chat history unchanged (placeholder follow-up step)."""
        yield history
        # save_image_filepath("./IMG_yosuke2.jpg")

    # On submit: compute the answer, then run the follow-up step.
    msg.submit(user, [msg, chatbot], [msg, chatbot], queue=True).then(
        bot, chatbot, chatbot
    )
|
96 |
+
|
97 |
+
# Enable request queuing, then start the app with a public share link.
demo.queue().launch(share=True)
|
requirements.txt
ADDED
Binary file (6.49 kB). View file
|
|
ηΎεγγγ―η·εγ«γΏγγ°η¬¬31η_εε.pdf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d80f5dc28cd581b4811c24de29b98524856292e196a430c7d360c511363c1889
|
3 |
+
size 168321766
|
ηΎεγγγ―η·εγ«γΏγγ°η¬¬31η_εΎε.pdf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ebe14b6c3d2a83c3da76e85427b492678802549093442b78790174dcf42ae385
|
3 |
+
size 88753140
|