Spaces:

techconspartners
/

ConversAI

Sleeping

App Files Files Community

Rauhan committed on Aug 19, 2024

Commit

058f9cb

1 Parent(s): 74620ef

UPDATE: supabase

Browse files

Files changed (1) hide show

app.py +17 -3

app.py CHANGED Viewed

@@ -10,6 +10,8 @@ from src.api.speech_api import speech_translator_router
 from functions import client as supabase
 from urllib.parse import urlparse
 import nltk
 nltk.download('punkt_tab')
@@ -301,17 +303,29 @@ async def addText(addQaPair: AddQAPair):
 @app.post("/addWebsite")
 async def addWebsite(vectorstore: str, websiteUrls: list[str]):
     text = extractTextFromUrlList(urls = websiteUrls)
     username, chatbotname = vectorstore.split("$")[1], vectorstore.split("$")[2]
     df = pd.DataFrame(client.table("ConversAI_ChatbotInfo").select("*").execute().data)
     currentCount = df[(df["user_id"] == username) & (df["chatbotname"] == chatbotname)]["charactercount"].iloc[0]
     newCount = currentCount + len(text)
-    limit = client.table("ConversAI_UserConfig").select("tokenLimit").eq("user_id", username).execute().data[0][
-        "tokenLimit"]
     if newCount < int(limit):
         client.table("ConversAI_ChatbotInfo").update({"charactercount": str(newCount)}).eq("user_id", username).eq(
             "chatbotname", chatbotname).execute()
-        return addDocuments(text=text, source=urlparse(websiteUrls[0]).netloc, vectorstore=vectorstore)
     else:
         return {
             "output": "WEBSITE EXCEEDING LIMITS, PLEASE TRY WITH A SMALLER DOCUMENT."

 from functions import client as supabase
 from urllib.parse import urlparse
 import nltk
+import time
+import uuid
 nltk.download('punkt_tab')
 @app.post("/addWebsite")
 async def addWebsite(vectorstore: str, websiteUrls: list[str]):
+    start = time.time()
     text = extractTextFromUrlList(urls = websiteUrls)
+    textExtraction = time.time()
+    timeTaken = f"TEXT EXTRACTION TIME: {textExtraction - start}s" + "\n"
+    links = "LINKS:\n" + "\n".join(websiteUrls) + "\n"
+    newText = timeTaken + links + "TEXT: \n" + text
+    fileId = str(uuid.uuid4())
+    with open(f"{fileId}.txt", "w") as file:
+        file.write(newText)
+    with open(f"{fileId}.txt", "rb") as f:
+        supabase.storage.from_("ConversAI").upload(file = f, path = os.path.join("/", f.name), file_options={"content-type": "text/plain"})
+    os.remove(f"{fileId}.txt")
     username, chatbotname = vectorstore.split("$")[1], vectorstore.split("$")[2]
     df = pd.DataFrame(client.table("ConversAI_ChatbotInfo").select("*").execute().data)
     currentCount = df[(df["user_id"] == username) & (df["chatbotname"] == chatbotname)]["charactercount"].iloc[0]
     newCount = currentCount + len(text)
+    limit = client.table("ConversAI_UserConfig").select("tokenLimit").eq("user_id", username).execute().data[0]["tokenLimit"]
     if newCount < int(limit):
         client.table("ConversAI_ChatbotInfo").update({"charactercount": str(newCount)}).eq("user_id", username).eq(
             "chatbotname", chatbotname).execute()
+        output = addDocuments(text=text, source=urlparse(websiteUrls[0]).netloc, vectorstore=vectorstore)
+        output["supabaseFileName"] = f"{fileId}.txt"
+        return output
     else:
         return {
             "output": "WEBSITE EXCEEDING LIMITS, PLEASE TRY WITH A SMALLER DOCUMENT."