Spaces:

quoc-khanh
/

chatbot4nct_test1

Sleeping

quoc-khanh committed on Feb 25

Commit

77263a0

verified ·

1 Parent(s): fd22419

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -20,36 +20,6 @@ key = "AIzaSyDJ4vIKuIBIPNHATLxnoHlagXWbsAz-vRs"
 # Cấu hình API key cho Google GenAI
 genai.configure(api_key=key)
-### loop cho tất cả các file tài liệu và cộng lại thành final_all_split (nhét vào 1 database)
-folder_path = 'syllabus_nct_word_format/'
-docx_files = list_docx_files(folder_path)
-all_splits = []  # Khởi tạo danh sách lưu kết quả
-for i, file_path in enumerate(tqdm(docx_files, desc="Đang xử lý", unit="file")):
-    output_json_path = f"output_{i}.json"
-    splits = get_splits(file_path, output_json_path)
-    all_splits += splits
-# output_json_path = "output_{i}.json"
-# splits = get_splits(docx_files, output_json_path)
-# all_splits += splits
-FAQ_path = 'syllabus_nct_word_format/FAQ.json'
-FAQ_splits = get_json_splits_only(FAQ_path)
-all_splits += FAQ_splits
-# web_path = 'https'
-# web_splits = await get_urls_splits(url='https://nct.neu.edu.vn/')
-# all_splits += web_splits
-# Lưu vào vectorstore với nhúng từ GenAI (Cần chỉ định model)
-embedding = GoogleGenerativeAIEmbeddings(model="models/text-embedding-004")
-vectorstore = FAISS.from_documents(documents=all_splits, embedding=embedding)
-###
 institutions = ['Tất cả'] + ['Trường Công Nghệ']
 categories = ['Tất cả'] + ['Đề án', 'Chương trình đào tạo']

 # Cấu hình API key cho Google GenAI
 genai.configure(api_key=key)
 institutions = ['Tất cả'] + ['Trường Công Nghệ']
 categories = ['Tất cả'] + ['Đề án', 'Chương trình đào tạo']