Spaces:

Mykes
/

rumed-phi3-mini

Sleeping

Mykes committed on Jul 14, 2024

Commit

a13e583

verified ·

1 Parent(s): c90d5be

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -41,14 +41,14 @@ def load_model():
         repo_id="Mykes/med_phi3-mini-4k-GGUF",
         filename="*Q4_K_M.gguf",
         verbose=False,
-        n_ctx=256,  # Reduced context window
-        n_batch=8,  # Smaller batch size
-        n_threads=2,  # Adjust based on your CPU cores
         use_mmap=True,
-        # n_ctx=1024,
-        # n_batch=512,
-        # n_threads=8,
-        # use_mlock=True,
         # use_mmap=True,
     )
@@ -110,7 +110,7 @@ if prompt := st.chat_input("What is your question?"):
     st.session_state.messages.append({"role": "user", "content": prompt})
     # Format the context with the last 5 messages
-    context = format_context(st.session_state.messages[-5:])
     # Prepare the model input
     model_input = f"{context}Human: {prompt}\nAssistant:"

         repo_id="Mykes/med_phi3-mini-4k-GGUF",
         filename="*Q4_K_M.gguf",
         verbose=False,
+        n_ctx=512,
+        n_batch=512,
+        n_threads=8,
+        use_mlock=True,
         use_mmap=True,
+        # n_ctx=256,  # Reduced context window
+        # n_batch=8,  # Smaller batch size
+        # n_threads=2,  # Adjust based on your CPU cores
         # use_mmap=True,
     )
     st.session_state.messages.append({"role": "user", "content": prompt})
    # Format the context with the last 3 messages
+    context = format_context(st.session_state.messages[-3:])
     # Prepare the model input
     model_input = f"{context}Human: {prompt}\nAssistant:"