Spaces:

Pearx
/

ChatGPT-Assistant

Runtime error

App Files Community

Pearx committed on Apr 26, 2023

Commit

cea8bca

•

1 Parent(s): 00fa5e9

Update helper.py

Browse files

Files changed (1) hide show

helper.py +72 -65

helper.py CHANGED Viewed

@@ -1,73 +1,48 @@
 import json
 import os
 import re
-import builtins
-import shutil
 import uuid
-from functools import wraps
 import streamlit as st
 import pandas as pd
 from custom import *
-# 聊天记录处理
-def clear_folder(path):
-    if not os.path.exists(path):
-        return
-    for file_name in os.listdir(path):
-        file_path = os.path.join(path, file_name)
-        try:
-            shutil.rmtree(file_path)
-        except Exception:
-            pass
-def set_chats_path():
-    save_path = 'chat_history'
-    if 'apikey' not in st.secrets:
-        clear_folder('tem_files')
-        save_path = 'tem_files/tem_chat' + str(uuid.uuid4())
-    return save_path
-# 重新open函数，路径不存在时自动创建
-def create_path(func):
-    @wraps(func)
-    def wrapper(path, *args, **kwargs):
-        if not os.path.exists(os.path.dirname(path)):
-            os.makedirs(os.path.dirname(path))
-        return func(path, *args, **kwargs)
-    return wrapper
-open = create_path(builtins.open)
-def get_history_chats(path):
-    try:
-        os.makedirs(path)
-    except FileExistsError:
-        pass
-    files = [f for f in os.listdir(f'./{path}') if f.endswith('.json')]
-    files_with_time = [(f, os.stat(f'./{path}/' + f).st_ctime) for f in files]
-    sorted_files = sorted(files_with_time, key=lambda x: x[1], reverse=True)
-    chat_names = [os.path.splitext(f[0])[0] for f in sorted_files]
-    if len(chat_names) == 0:
-        chat_names.append('New Chat_' + str(uuid.uuid4()))
     return chat_names
 def save_data(path: str, file_name: str, history: list, paras: dict, contexts: dict, **kwargs):
     with open(f"./{path}/{file_name}.json", 'w', encoding='utf-8') as f:
         json.dump({"history": history, "paras": paras, "contexts": contexts, **kwargs}, f)
-def remove_data(path: str, file_name: str):
     try:
-        os.remove(f"./{path}/{file_name}.json")
     except FileNotFoundError:
         pass
 def load_data(path: str, file_name: str) -> dict:
@@ -76,12 +51,14 @@ def load_data(path: str, file_name: str) -> dict:
             data = json.load(f)
             return data
     except FileNotFoundError:
-        with open(f"./{path}/{file_name}.json", 'w', encoding='utf-8') as f:
-            f.write(json.dumps(initial_content_all))
-        return initial_content_all
-def show_each_message(message, role, area=None):
     if area is None:
         area = [st.markdown] * 2
     if role == 'user':
@@ -106,23 +83,26 @@ def show_messages(messages: list):
 # 根据context_level提取history
-def get_history_input(history, level):
-    df_history = pd.DataFrame(history)
-    df_system = df_history.query('role=="system"')
-    df_input = df_history.query('role!="system"')
-    df_input = df_input[-level * 2:]
-    res = pd.concat([df_system, df_input], ignore_index=True).to_dict('records')
     return res
 # 去除#号右边的空格
-def remove_hashtag_right__space(text):
     res = re.sub(r"(#+)\s*", r"\1", text)
     return res
 # 提取文本
-def extract_chars(text, num):
     char_num = 0
     chars = ''
     for char in text:
@@ -134,4 +114,31 @@ def extract_chars(text, num):
         chars += char
         if char_num >= num:
             break
-    return chars

 import json
 import os
 import re
 import uuid
 import streamlit as st
 import pandas as pd
 from custom import *
+import copy
+import io
+def get_history_chats(path: str) -> list:
+    if "apikey" in st.secrets:
+        if not os.path.exists(path):
+            os.makedirs(path)
+        files = [f for f in os.listdir(f'./{path}') if f.endswith('.json')]
+        files_with_time = [(f, os.stat(f'./{path}/' + f).st_ctime) for f in files]
+        sorted_files = sorted(files_with_time, key=lambda x: x[1], reverse=True)
+        chat_names = [os.path.splitext(f[0])[0] for f in sorted_files]
+        if len(chat_names) == 0:
+            chat_names.append('New Chat_' + str(uuid.uuid4()))
+    else:
+        chat_names = ['New Chat_' + str(uuid.uuid4())]
     return chat_names
 def save_data(path: str, file_name: str, history: list, paras: dict, contexts: dict, **kwargs):
+    if not os.path.exists(path):
+        os.makedirs(path)
     with open(f"./{path}/{file_name}.json", 'w', encoding='utf-8') as f:
         json.dump({"history": history, "paras": paras, "contexts": contexts, **kwargs}, f)
+def remove_data(path: str, chat_name: str):
     try:
+        os.remove(f"./{path}/{chat_name}.json")
     except FileNotFoundError:
         pass
+    # 清除缓存
+    try:
+        st.session_state.pop('history' + chat_name)
+        for item in ["context_select", "context_input", "context_level", *initial_content_all['paras']]:
+            st.session_state.pop(item + chat_name + "value")
+    except KeyError:
+        pass
 def load_data(path: str, file_name: str) -> dict:
             data = json.load(f)
             return data
     except FileNotFoundError:
+        content = copy.deepcopy(initial_content_all)
+        if "apikey" in st.secrets:
+            with open(f"./{path}/{file_name}.json", 'w', encoding='utf-8') as f:
+                f.write(json.dumps(content))
+        return content
+def show_each_message(message: str, role: str, area=None):
     if area is None:
         area = [st.markdown] * 2
     if role == 'user':
 # 根据context_level提取history
+def get_history_input(history: list, level: int) -> list:
+    if level != 0:
+        df_history = pd.DataFrame(history)
+        df_system = df_history.query('role=="system"')
+        df_input = df_history.query('role!="system"')
+        df_input = df_input[-level * 2:]
+        res = pd.concat([df_system, df_input], ignore_index=True).to_dict('records')
+    else:
+        res = []
     return res
 # 去除#号右边的空格
+def remove_hashtag_right__space(text: str) -> str:
     res = re.sub(r"(#+)\s*", r"\1", text)
     return res
 # 提取文本
+def extract_chars(text: str, num: int) -> str:
     char_num = 0
     chars = ''
     for char in text:
         chars += char
         if char_num >= num:
             break
+    return chars
+def download_history(history: list):
+    md_text = ""
+    for msg in history:
+        if msg['role'] == 'user':
+            md_text += f'## {user_name}：\n{msg["content"]}\n'
+        elif msg['role'] == 'assistant':
+            md_text += f'## {gpt_name}：\n{msg["content"]}\n'
+    output = io.BytesIO()
+    output.write(md_text.encode('utf-8'))
+    output.seek(0)
+    return output
+def filename_correction(filename: str) -> str:
+    pattern = r'[^\w\.-]'
+    filename = re.sub(pattern, '', filename)
+    return filename
+def url_correction(text: str) -> str:
+    pattern = r'http[s]?://(?:[a-zA-Z]|[0-9]|[$-_@.&+#]|[!*\(\),]|(?:%[0-9a-fA-F][0-9a-fA-F]))+'
+    links = re.findall(pattern, text)
+    for link in links:
+        text = text.replace(link, " " + link + " ")
+    return text