Crypto_Market_Data_Agent

Sleeping

App Files Files Community

wphoenix committed on Feb 13

Commit

1464680

verified ·

1 Parent(s): b861b31

Update app.py

Browse files

Files changed (1) hide show

app.py +60 -4

app.py CHANGED Viewed

@@ -36,16 +36,72 @@ def get_current_time_in_timezone(timezone: str) -> str:
 final_answer = FinalAnswerTool()
 # If the agent does not answer, the model is overloaded, please use another model or the following Hugging Face Endpoint that also contains qwen2.5 coder:
 # model_id='https://pflgm2locj2t89co.us-east-1.aws.endpoints.huggingface.cloud'
 model = HfApiModel(
-max_tokens=2096,
-temperature=0.5,
-model_id='https://pflgm2locj2t89co.us-east-1.aws.endpoints.huggingface.cloud',# it is possible that this model may be overloaded
-custom_role_conversions=None,
 )
 # Import tool from Hub
 image_generation_tool = load_tool("agents-course/text-to-image", trust_remote_code=True)

 final_answer = FinalAnswerTool()
+############# MODEL SELECTION ################################################
 # If the agent does not answer, the model is overloaded, please use another model or the following Hugging Face Endpoint that also contains qwen2.5 coder:
 # model_id='https://pflgm2locj2t89co.us-east-1.aws.endpoints.huggingface.cloud'
+# model = HfApiModel(
+# max_tokens=2096,
+# temperature=0.5,
+# model_id='https://pflgm2locj2t89co.us-east-1.aws.endpoints.huggingface.cloud',# it is possible that this model may be overloaded
+# custom_role_conversions=None,
+# )
+MODEL_IDS = [
+    #'https://wxknx1kg971u7k1n.us-east-1.aws.endpoints.huggingface.cloud/',
+    #'https://jc26mwg228mkj8dw.us-east-1.aws.endpoints.huggingface.cloud/',
+    # 'https://pflgm2locj2t89co.us-east-1.aws.endpoints.huggingface.cloud'
+    #'meta-llama/Llama-3.2-1B-Instruct', ## Does a poor job of interpreting my questions and matching them to the tools
+    'Qwen/Qwen2.5-Coder-32B-Instruct',
+    'Qwen/Qwen2.5-Coder-14B-Instruct',
+    'Qwen/Qwen2.5-Coder-7B-Instruct',
+    'Qwen/Qwen2.5-Coder-3B-Instruct',
+    'Qwen/Qwen2.5-Coder-1.5B-Instruct'
+    # Add whichever models work for you here; get_available_model() tries them in list order
+]
+def is_model_overloaded(model_url):
+    """Verify if the model is overloaded doing a test call."""
+    try:
+        response = requests.post(model_url, json={"inputs": "Test"})
+        if verbose:
+            print(response.status_code)
+        if response.status_code == 503:  # 503 Service Unavailable = Overloaded
+            return True
+        if response.status_code == 404:  # 404 Client Error: Not Found
+            return True
+        if response.status_code == 424:  # 424 Client Error: Failed Dependency for url:
+            return True
+        return False
+    except requests.RequestException:
+        return True  # if there are an error is overloaded
+def get_available_model():
+    """Select the first model available from the list."""
+    for model_url in MODEL_IDS:
+        print("trying",model_url)
+        if not is_model_overloaded(model_url):
+            return model_url
+    return MODEL_IDS[0]  # if all are failing, use the first model by dfault
+if verbose: print("Checking available models.")
+selected_model_id = get_available_model()
 model = HfApiModel(
+    max_tokens=1048,
+    temperature=0.5,
+    #model_id='meta-llama/Llama-3.2-1B-Instruct',
+    #model_id='Qwen/Qwen2.5-Coder-32B-Instruct',
+    #model_id = 'Qwen/Qwen2.5-Coder-1.5B-Instruct',
+    model_id = selected_model_id, # first model in MODEL_IDS that passed the availability probe (or MODEL_IDS[0] as fallback)
+    custom_role_conversions=None,
 )
+############# END: MODEL SELECTION ################################################
 # Import tool from Hub
 image_generation_tool = load_tool("agents-course/text-to-image", trust_remote_code=True)