Spaces:

qanta-challenge
/

quizbowl-submission

Running

App Files Files Community

Maharshi Gor committed on Apr 3

Commit

2900a81

1 Parent(s): d15e788

Bugfix: llm model calls for Anthropic and gpt-3.5

Browse files

Files changed (1) hide show

src/llms.py +68 -44

src/llms.py CHANGED Viewed

@@ -4,60 +4,38 @@ import os
 from typing import Optional
 import cohere
-import json_repair
 import numpy as np
-from anthropic import Anthropic
 from langchain_anthropic import ChatAnthropic
 from langchain_cohere import ChatCohere
 from langchain_openai import ChatOpenAI
 from openai import OpenAI
 from pydantic import BaseModel, Field
 from rich import print as rprint
-import utils
 from app_configs import AVAILABLE_MODELS
 class LLMOutput(BaseModel):
     content: str = Field(description="The content of the response")
     logprob: Optional[float] = Field(None, description="The log probability of the response")
-def completion(model: str, system: str, prompt: str, response_format, logprobs: bool = False) -> str:
-    """
-    Generate a completion from an LLM provider with structured output.
-    Args:
-        model (str): Provider and model name in format "provider/model" (e.g. "OpenAI/gpt-4")
-        system (str): System prompt/instructions for the model
-        prompt (str): User prompt/input
-        response_format: Pydantic model defining the expected response structure
-        logprobs (bool, optional): Whether to return log probabilities. Defaults to False.
-            Note: Not supported by Anthropic models.
-    Returns:
-        dict: Contains:
-            - output: The structured response matching response_format
-            - logprob: (optional) Sum of log probabilities if logprobs=True
-            - prob: (optional) Exponential of logprob if logprobs=True
-    Raises:
-        ValueError: If logprobs=True with Anthropic models
-    """
-    if model not in AVAILABLE_MODELS:
-        raise ValueError(f"Model {model} not supported")
-    model_name = AVAILABLE_MODELS[model]["model"]
-    provider = model.split("/")[0]
-    if provider == "Cohere":
-        return _cohere_completion(model_name, system, prompt, response_format, logprobs)
-    elif provider == "OpenAI":
-        return _openai_completion(model_name, system, prompt, response_format, logprobs)
-    elif provider == "Anthropic":
-        if logprobs:
-            raise ValueError("Anthropic does not support logprobs")
-        return _anthropic_completion(model_name, system, prompt, response_format)
-    else:
-        raise ValueError(f"Provider {provider} not supported")
 def _cohere_completion(model: str, system: str, prompt: str, response_model, logprobs: bool = True) -> str:
@@ -81,6 +59,11 @@ def _cohere_completion(model: str, system: str, prompt: str, response_model, log
     return output
 def _openai_completion(model: str, system: str, prompt: str, response_model, logprobs: bool = True) -> str:
     messages = [
         {"role": "system", "content": system},
@@ -104,11 +87,52 @@ def _openai_completion(model: str, system: str, prompt: str, response_model, log
 def _anthropic_completion(model: str, system: str, prompt: str, response_model) -> str:
     llm = ChatAnthropic(model=model).with_structured_output(response_model, include_raw=True)
-    output = llm.invoke([("system", system), ("human", prompt)])
-    return {"content": output.raw, "output": output.parsed.model_dump()}
 if __name__ == "__main__":
     class ExplainedAnswer(BaseModel):
         """
@@ -118,12 +142,12 @@ if __name__ == "__main__":
         answer: str = Field(description="The short answer to the question")
         explanation: str = Field(description="5 words terse best explanation of the answer.")
-    model = "Anthropic/claude-3-5-sonnet-20240620"
     system = "You are an accurate and concise explainer of scientific concepts."
     prompt = "Which planet is closest to the sun in the Milky Way galaxy? Answer directly, no explanation needed."
-    # response = _cohere_completion("command-r", system, prompt, ExplainedAnswer, logprobs=True)
-    response = completion(model, system, prompt, ExplainedAnswer, logprobs=False)
-    rprint(response)
 # %%

 from typing import Optional
 import cohere
 import numpy as np
 from langchain_anthropic import ChatAnthropic
 from langchain_cohere import ChatCohere
 from langchain_openai import ChatOpenAI
+from loguru import logger
 from openai import OpenAI
 from pydantic import BaseModel, Field
 from rich import print as rprint
 from app_configs import AVAILABLE_MODELS
+def _openai_is_json_mode_supported(model_name: str) -> bool:  # True only for names starting with "gpt-4"
+    if model_name.startswith("gpt-4"):
+        return True
+    if model_name.startswith("gpt-3.5"):  # recognized prefix: reported as unsupported, no warning logged
+        return False
+    logger.warning(f"OpenAI model {model_name} is not available in this app, skipping JSON mode, returning False")
+    return False  # any other prefix: warned above, then treated as unsupported
 class LLMOutput(BaseModel):  # pydantic model: response text plus an optional log probability
     content: str = Field(description="The content of the response")  # required field
     logprob: Optional[float] = Field(None, description="The log probability of the response")  # defaults to None
+def _get_langchain_chat_output(llm, system: str, prompt: str) -> str:  # NOTE(review): annotated -> str, but a dict is returned below
+    output = llm.invoke([("system", system), ("human", prompt)])  # single call with (role, text) tuples
+    ai_message = output["raw"]  # both callers in this file build llm with include_raw=True
+    content = {"content": ai_message.content, "tool_calls": ai_message.tool_calls}
+    content_str = json.dumps(content)  # NOTE(review): no `import json` is visible in this diff -- confirm it exists
+    return {"content": content_str, "output": output["parsed"].model_dump()}  # NOTE(review): raises if output["parsed"] is None -- confirm whether that can occur
 def _cohere_completion(model: str, system: str, prompt: str, response_model, logprobs: bool = True) -> str:
     return output
+def _openai_langchain_completion(model: str, system: str, prompt: str, response_model, logprobs: bool = True) -> str:
+    llm = ChatOpenAI(model=model).with_structured_output(response_model, include_raw=True)  # NOTE(review): logprobs is accepted above but not passed on
+    return _get_langchain_chat_output(llm, system, prompt)  # returns the helper's result unchanged
 def _openai_completion(model: str, system: str, prompt: str, response_model, logprobs: bool = True) -> str:
     messages = [
         {"role": "system", "content": system},
 def _anthropic_completion(model: str, system: str, prompt: str, response_model) -> str:
     llm = ChatAnthropic(model=model).with_structured_output(response_model, include_raw=True)  # the helper below reads output["raw"] and output["parsed"]
+    return _get_langchain_chat_output(llm, system, prompt)  # same helper as _openai_langchain_completion
+def completion(model: str, system: str, prompt: str, response_format, logprobs: bool = False) -> str:  # NOTE(review): annotated -> str, but the docstring describes a dict
+    """
+    Generate a completion from an LLM provider with structured output.
+    The provider is the text before the first "/" in `model`. OpenAI models for which
+    `_openai_is_json_mode_supported` returns False are routed to `_openai_langchain_completion`.
+    Args:
+        model (str): Provider and model name in format "provider/model" (e.g. "OpenAI/gpt-4")
+        system (str): System prompt/instructions for the model
+        prompt (str): User prompt/input
+        response_format: Pydantic model defining the expected response structure
+        logprobs (bool, optional): Whether to return log probabilities. Defaults to False.
+            Note: Not supported by Anthropic models.
+            Note: `_openai_langchain_completion` receives this flag but does not use it.
+    Returns:
+        dict: Contains:
+            - output: The structured response matching response_format
+            - content: (LangChain-backed paths) JSON string of the raw message content and tool calls
+            - logprob: (optional) Sum of log probabilities if logprobs=True
+            - prob: (optional) Exponential of logprob if logprobs=True
+    Raises:
+        ValueError: If logprobs=True with Anthropic models
+        ValueError: If model is not a key of AVAILABLE_MODELS
+        ValueError: If the provider prefix is not Cohere, OpenAI, or Anthropic
+    """
+    if model not in AVAILABLE_MODELS:
+        raise ValueError(f"Model {model} not supported")
+    model_name = AVAILABLE_MODELS[model]["model"]  # the name passed on to the provider helpers
+    provider = model.split("/")[0]  # text before the first "/"
+    if provider == "Cohere":
+        return _cohere_completion(model_name, system, prompt, response_format, logprobs)
+    elif provider == "OpenAI":
+        if _openai_is_json_mode_supported(model_name):
+            return _openai_completion(model_name, system, prompt, response_format, logprobs)
+        else:
+            return _openai_langchain_completion(model_name, system, prompt, response_format, logprobs)  # fallback path; logprobs is not used there
+    elif provider == "Anthropic":
+        if logprobs:
+            raise ValueError("Anthropic does not support logprobs")
+        return _anthropic_completion(model_name, system, prompt, response_format)
+    else:
+        raise ValueError(f"Provider {provider} not supported")
+# %%
 if __name__ == "__main__":
+    from tqdm import tqdm
     class ExplainedAnswer(BaseModel):
         """
         answer: str = Field(description="The short answer to the question")
         explanation: str = Field(description="5 words terse best explanation of the answer.")
+    models = AVAILABLE_MODELS.keys()
     system = "You are an accurate and concise explainer of scientific concepts."
     prompt = "Which planet is closest to the sun in the Milky Way galaxy? Answer directly, no explanation needed."
+    for model in tqdm(models):
+        response = completion(model, system, prompt, ExplainedAnswer, logprobs=False)
+        rprint(response)
 # %%