Update app.py
app.py CHANGED
@@ -6,19 +6,6 @@ import time
 # Initialize the pipeline with the new model
 pipe = pipeline("text-generation", model="Blexus/Quble_test_model_v1_INSTRUCT_v1")
 
-DATABASE_PATH = "database.json"
-
-def load_database():
-    try:
-        with open(DATABASE_PATH, "r") as file:
-            return json.load(file)
-    except FileNotFoundError:
-        return {}
-
-def save_database(database):
-    with open(DATABASE_PATH, "w") as file:
-        json.dump(database, file)
-
 def format_prompt(message, system, history):
     prompt = f"SYSTEM: {system}\n<|endofsystem|>\n"
 
@@ -31,7 +18,6 @@ def format_prompt(message, system, history):
     return prompt
 
 def generate(prompt, system, history, temperature=0.9, max_new_tokens=4096, top_p=0.9, repetition_penalty=1.2):
-    database = load_database()
     temperature = float(temperature)
     if temperature < 1e-2:
         temperature = 1e-2
@@ -39,12 +25,8 @@ def generate(prompt, system, history, temperature=0.9, max_new_tokens=4096, top_
 
     formatted_prompt = format_prompt(prompt, system, history)
     response_text = "We are sorry but Quble doesn't know how to answer."
-
-    if formatted_prompt in database:
-        response_text = database[formatted_prompt]
-    else:
-        # Generate the response without streaming
-        try:
+    # Generate the response without streaming
+    try:
         response = pipe(formatted_prompt, max_new_tokens=max_new_tokens, temperature=temperature, top_p=top_p, repetition_penalty=repetition_penalty)[0]["generated_text"]
         response_text = response.split("ASSISTANT:")[-1].strip()
 
@@ -53,12 +35,9 @@ def generate(prompt, system, history, temperature=0.9, max_new_tokens=4096, top_
         for char in response_text:
             accumulated_response += char # Append the new character
             yield accumulated_response # Yield the accumulated response
-                time.sleep(0.02) # Add a slight delay to simulate typing
+            time.sleep(0.02) # Add a slight delay to simulate typing
 
-
-        database[formatted_prompt] = response_text
-        save_database(database)
-        except Exception as e:
+    except Exception as e:
         print(f"Error generating response: {e}")
 
 customCSS = """
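In short: the commit deletes the JSON-file response cache (DATABASE_PATH, load_database, save_database, and the cache lookup and save around the pipeline call), so every request now goes through the model. For reference, the resulting generation path reads roughly as below. This is a sketch reconstructed from the visible hunks, not the full app.py: the import block, the middle of format_prompt (hidden lines 12-17 of the diff), and the initialization of accumulated_response (hidden lines 33-34) are assumptions and are marked as such in the comments.

import time
from transformers import pipeline

# Initialize the pipeline with the new model
pipe = pipeline("text-generation", model="Blexus/Quble_test_model_v1_INSTRUCT_v1")

def format_prompt(message, system, history):
    prompt = f"SYSTEM: {system}\n<|endofsystem|>\n"
    # The body here is hidden in the diff; a plausible reconstruction
    # (assumption) is that it appends the past chat turns:
    for user_turn, assistant_turn in history:
        prompt += f"USER: {user_turn}\nASSISTANT: {assistant_turn}\n"
    prompt += f"USER: {message}\nASSISTANT:"
    return prompt

def generate(prompt, system, history, temperature=0.9, max_new_tokens=4096, top_p=0.9, repetition_penalty=1.2):
    temperature = float(temperature)
    if temperature < 1e-2:
        temperature = 1e-2  # clamp so sampling never sees temperature <= 0

    formatted_prompt = format_prompt(prompt, system, history)
    response_text = "We are sorry but Quble doesn't know how to answer."
    # Generate the response without streaming
    try:
        response = pipe(formatted_prompt, max_new_tokens=max_new_tokens,
                        temperature=temperature, top_p=top_p,
                        repetition_penalty=repetition_penalty)[0]["generated_text"]
        response_text = response.split("ASSISTANT:")[-1].strip()

        accumulated_response = ""  # assumed; this line sits in a hidden region of the diff
        for char in response_text:
            accumulated_response += char  # Append the new character
            yield accumulated_response  # Yield the accumulated response
            time.sleep(0.02)  # Add a slight delay to simulate typing

    except Exception as e:
        print(f"Error generating response: {e}")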
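Because generate is a generator that yields the accumulated text after each character, a caller (presumably the Space's web UI) just iterates it. A minimal smoke test, with an assumed system prompt and an empty history:

reply = ""
for partial in generate("Hello!", "You are Quble, a helpful assistant.", []):
    reply = partial  # each yield is the full response so far
print(reply)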