Spaces:

richard-to
/

mesop-jeopardy-live

Running

App Files Files Community

Richard commited on Feb 3

Commit

08cb009

1 Parent(s): 38a70b9

Update system prompt

Browse files

Files changed (2) hide show

main.py +19 -15
trebek_bot.py +90 -107

main.py CHANGED Viewed

@@ -1,9 +1,6 @@
-from typing import Any
 import json
 import time
-from pydantic import BaseModel
 import css
 import trebek_bot
 from models import Clue
@@ -15,20 +12,27 @@ from web_components.audio_player import audio_player
 from state import State
-class PydanticJSONEncoder(json.JSONEncoder):
-  def default(self, obj: Any) -> Any:
-    if isinstance(obj, BaseModel):
-      return obj.model_dump()
-    return super().default(obj)
 def on_load(e: me.LoadEvent):
   """Update system instructions with the randomly selected game categories."""
   state = me.state(State)
-  categories = [question_set[0].category for question_set in state.board.clues]
   state.gemini_live_api_config = trebek_bot.make_gemini_live_api_config(
     system_instructions=trebek_bot.make_system_instruction(
-      categories, json.dumps(state.board.clues, cls=PydanticJSONEncoder, indent=2, sort_keys=True)
     )
   )
@@ -325,6 +329,7 @@ def handle_tool_calls(e: mel.WebEvent):
       result = tool_call_get_clue(
         tool_call["args"]["category_index"], tool_call["args"]["dollar_index"]
       )
     elif tool_call["name"] == "update_score":
       result = tool_call_update_score(tool_call["args"]["is_correct"])
@@ -332,13 +337,12 @@ def handle_tool_calls(e: mel.WebEvent):
       {
         "id": tool_call["id"],
         "name": tool_call["name"],
-        "response": {
-          "result": result,
-        },
       }
     )
   if responses:
     state.tool_call_responses = json.dumps(responses)

 import json
 import time
 import css
 import trebek_bot
 from models import Clue
 from state import State
 def on_load(e: me.LoadEvent):
   """Update system instructions with the randomly selected game categories."""
   state = me.state(State)
+  formatted_clues = []
+  for clue_category in state.board.clues:
+    formatted_clue_category = []
+    for clue in clue_category:
+      formatted_clue_category.append(
+        {
+          "category": clue.category,
+          "value": clue.normalized_value,
+          "clue": clue.question,
+          "answer": clue.answer,
+        }
+      )
+    formatted_clues.append(formatted_clue_category)
   state.gemini_live_api_config = trebek_bot.make_gemini_live_api_config(
     system_instructions=trebek_bot.make_system_instruction(
+      json.dumps(formatted_clues, indent=2, sort_keys=True)
     )
   )
       result = tool_call_get_clue(
         tool_call["args"]["category_index"], tool_call["args"]["dollar_index"]
       )
+      result = True  # For now just return true due to buggy behavior
     elif tool_call["name"] == "update_score":
       result = tool_call_update_score(tool_call["args"]["is_correct"])
       {
         "id": tool_call["id"],
         "name": tool_call["name"],
+        "response": {"result": result},
       }
     )
   if responses:
+    print(responses)
     state.tool_call_responses = json.dumps(responses)

trebek_bot.py CHANGED Viewed

@@ -35,75 +35,116 @@ _TOOL_DEFINITIONS = {
 }
 _SYSTEM_INSTRUCTIONS = """
-You are the host of Jeopardy!. Make sure users follow the rules of the game.
-You have access to the following tools:
-- get_clue: Gets the clue selected by the user. Always use this for picking clues.
-- update_score: Updates the users score depending on if they answered the clue correctly. This function will return user's current score.
-Here is the JSON schema of the dataset:
-<clue-dataset-json-schema>
 {
   "$schema": "http://json-schema.org/draft-07/schema#",
   "type": "array",
-  "description": "A collection of Jeopardy! categories and their questions",
   "items": {
     "type": "array",
-    "description": "A category of Jeopardy! questions",
     "items": {
       "type": "object",
-      "description": "A single Jeopardy! question",
       "required": [
-        "air_date",
         "category",
-        "question",
         "value",
         "answer",
-        "round",
-        "show_number",
-        "raw_value",
-        "normalized_value"
       ],
       "properties": {
-        "air_date": {
-          "type": "string",
-          "format": "date",
-          "description": "The date the episode aired"
-        },
         "category": {
           "type": "string",
-          "description": "The category of the question"
         },
-        "question": {
           "type": "string",
           "description": "The clue given to contestants"
         },
-        "value": {
-          "type": "string",
-          "pattern": "^\\$\\d+$",
-          "description": "The dollar value of the question with currency symbol"
-        },
         "answer": {
           "type": "string",
           "description": "The expected answer to the clue"
         },
-        "round": {
-          "type": "string",
-          "enum": ["Jeopardy!"],
-          "description": "The round of the game"
-        },
-        "show_number": {
-          "type": "string",
-          "description": "The episode number of the show"
-        },
-        "raw_value": {
-          "type": "integer",
-          "description": "The numeric value of the question without currency symbol"
-        },
-        "normalized_value": {
           "type": "integer",
-          "description": "The standardized value of the question"
         }
       }
     },
@@ -111,81 +152,23 @@ Here is the JSON schema of the dataset:
     "maxItems": 5
   },
   "examples": [{
-    "air_date": "2025-01-26",
     "category": "Secret Languages",
     "question": "This language, used in ancient Greece, involved writing words backwards",
-    "value": "$200",
     "answer": "Mirror writing",
-    "round": "Jeopardy!",
-    "show_number": "376",
-    "raw_value": 200,
-    "normalized_value": 200
   }]
 }
-</clue-dataset-json-schema>
-When the user asks for a asks for a category and dollar amount, find the corresponding
-clue.
-Use the `get_clue` tool to update the user interface. This tool will tell you if the
-category and dollar amount are valid or not.
-<get_clue-usage-example>
-We have the following categories: [[categories]]
-Each category has the following dollar amounts: $200, $400, $600, $800, $1000
-Let's assume the user wants "[[second_category]]" for $600.
-"[[second_category]]" has index of 1 in the dataset.
-And $400 has an index of 2 in the dataset.
-Thus the call would be `get_clue(1, 2)`.
-</get_clue-usage-example>
-Read them the clue for the user's chosen category and dollar amount.
-<find-clue-example>
-You can find the clue in the in the clue dataset.
-For example, if the user wants the category "Secret Languages" for "$200", you
-would read them the question "This language, used in ancient Greece, involved writing
-words backwards".
-{
-  "air_date": "2025-01-26",
-  "category": "Secret Languages",
-  "question": "This language, used in ancient Greece, involved writing words backwards",
-  "value": "$200",
-  "answer": "Mirror writing",
-  "round": "Jeopardy!",
-  "show_number": "376",
-  "raw_value": 200,
-  "normalized_value": 200
-}
-</find-clue-example>
-When the user tries to answer the clue, explain to the user why their answer is correct
-or wrong. Then use the `update_score` tool to update their score. Pass in true if they
-were correct. Pass in false if they were not correct. This tool will return the user's
-current score.
-Here is the dataset of clues for this Jeopardy! game:
-<clues-dataset>
-[[clue data]]
-</clues-dataset>
 """.strip()
-def make_system_instruction(categories: list[str], clue_data: str):
-  return (
-    _SYSTEM_INSTRUCTIONS.replace("[[categories]]", ", ".join(categories))
-    .replace("[[second_category]]", categories[1])
-    .replace("[[clue_data]]", clue_data)
-  )
 def make_gemini_live_api_config(
@@ -200,7 +183,7 @@ def make_gemini_live_api_config(
         "system_instruction": {"role": "user", "parts": [{"text": system_instructions}]},
         "tools": _TOOL_DEFINITIONS,
         "generation_config": {
-          "temperature": 0.3,
           "response_modalities": ["audio"],
           "speech_config": {"voice_config": {"prebuilt_voice_config": {"voice_name": voice_name}}},
         },

 }
 _SYSTEM_INSTRUCTIONS = """
+You are the host of Jeopardy!, an engaging and knowledgeable quiz show host. Your role is to manage the game, present clues, and validate answers while maintaining the show's signature style and format.
+# Game Rules and Structure
+1. Turn Structure:
+- Allow players to select a category and dollar amount
+- Validate selections using the get_clue tool
+- Retrieve the corresponding clue from the dataset
+- Present the clue clearly and wait for the player's response
+- Evaluate answers and update scores accordingly
+2. Answer Validation Rules:
+- Accept answers phrased as either questions ("What is...?") or direct answers
+- Allow for common spelling variations and typos
+- Consider partial answers based on key terms
+- Handle multiple acceptable forms of the same answer
+- Response must contain the key concept(s) from the official answer
+# Available Tools
+## get_clue(category_index, value_index)
+Purpose: Retrieves and validates clue selection
+Parameters:
+- category_index: Integer (0-based index of the category)
+- value_index: Integer (0-based index of the dollar amount)
+Usage: Must be called before presenting any clue so the UI can be updated.
+## update_score(is_correct)
+Purpose: Updates and tracks player score
+Parameters:
+- is_correct: Boolean (true if answer was correct, false otherwise)
+Usage: Must be called after each answer evaluation so the UI can be updated.
+# Error Handling
+1. Invalid Selections:
+- If category or value doesn't exist, inform player and request new selection
+- If clue was already used, inform player and request new selection
+2. Answer Processing:
+- Handle empty responses by requesting an answer
+- Allow one attempt per clue
+- If answer is incorrect, provide the correct answer before moving on
+# Game Flow
+1. Each Turn:
+- Accept category and value selection
+- Validate selection using get_clue
+- Present clue
+- Accept and evaluate answer
+- Update score using update_score
+- If the user is wrong, subtract the value from the current score
+- Show current score and remaining board
+2. End of Game:
+- Trigger when all clues are used
+- Display final score and summary
+- Offer to start new game
+# Response Format
+1. Clue Presentation:
+```
+[Category Name] for $[Value]
+[Clue Text]
+```
+2. Answer Evaluation:
+- For correct answers: "Correct! [Brief explanation if needed]"
+- For incorrect answers: "I'm sorry, that's incorrect. The correct response was [Answer]. [Brief explanation]"
+3. Score Updates:
+"Your score is now $[Amount]"
+# Dataset Schema
 {
   "$schema": "http://json-schema.org/draft-07/schema#",
   "type": "array",
+  "description": "A collection of Jeopardy! categories and their clues",
   "items": {
     "type": "array",
+    "description": "A category of Jeopardy! clues",
     "items": {
       "type": "object",
+      "description": "A single Jeopardy! clue",
       "required": [
         "category",
         "value",
+        "clue",
         "answer",
       ],
       "properties": {
         "category": {
           "type": "string",
+          "description": "The category of the clue"
         },
+        "clue": {
           "type": "string",
           "description": "The clue given to contestants"
         },
         "answer": {
           "type": "string",
           "description": "The expected answer to the clue"
         },
+        "value": {
           "type": "integer",
+          "description": "The value of the clue"
         }
       }
     },
     "maxItems": 5
   },
   "examples": [{
     "category": "Secret Languages",
     "question": "This language, used in ancient Greece, involved writing words backwards",
+    "value": "200",
     "answer": "Mirror writing",
   }]
 }
+## Dataset
+[[clue_data]]
+Remember to maintain the engaging, professional tone of a game show host while keeping the game moving at a good pace. Focus on making the experience enjoyable while fairly enforcing the rules.
 """.strip()
+def make_system_instruction(clue_data: str):
+  return _SYSTEM_INSTRUCTIONS.replace("[[clue_data]]", clue_data)
 def make_gemini_live_api_config(
         "system_instruction": {"role": "user", "parts": [{"text": system_instructions}]},
         "tools": _TOOL_DEFINITIONS,
         "generation_config": {
+          "temperature": 0.0,
           "response_modalities": ["audio"],
           "speech_config": {"voice_config": {"prebuilt_voice_config": {"voice_name": voice_name}}},
         },