Spaces:

ashmib
/

user-feedback

Running

App Files Community

Ashmi Banerjee committed on Feb 1

Commit

88f694a

1 Parent(s): 8c5eede

made it work for merged data

Browse files

Files changed (6) hide show

app.py +2 -13
dummy_qa_data.csv +0 -11
test.py +138 -0
utils/loaders.py +1 -2
utils/notebooks/Data Merging.ipynb +858 -0
views/questions_screen.py +4 -4

app.py CHANGED Viewed

@@ -1,5 +1,3 @@
-import json
-from typing import Dict
 from utils.loaders import load_data
 from db.crud import read
 import streamlit as st
@@ -9,20 +7,11 @@ from views.intro_screen import welcome_screen
 from views.questions_screen import questions_screen, survey_completed
 from views.continue_survey import continue_survey_screen
 from css.layout import custom_css
 load_dotenv()
 VALIDATION_CODE = os.getenv("VALIDATION_CODE")
-if "VALIDATION_CODE" in os.environ:
-    VALIDATION_CODE = os.getenv("VALIDATION_CODE")
-if "DATA_REPO" in os.environ:
-    REPO_NAME = os.getenv("DATA_REPO")
-else:
-    print("DATA_REPO not found in environment variables.")
-if "GEMINI_DATA_FILES" in os.environ:
-    DATA_FILES = os.getenv("GEMINI_DATA_FILES")
-else:
-    print("LLAMA_DATA_FILES not found in environment variables.")
 def initialization():

 from utils.loaders import load_data
 from db.crud import read
 import streamlit as st
 from views.questions_screen import questions_screen, survey_completed
 from views.continue_survey import continue_survey_screen
 from css.layout import custom_css
+# st.set_page_config(layout="wide")
 load_dotenv()
 VALIDATION_CODE = os.getenv("VALIDATION_CODE")
 def initialization():

dummy_qa_data.csv DELETED Viewed

@@ -1,11 +0,0 @@
-q_id,Question,Generated Answer
-q_1,What is the capital of France?,The capital of France is Paris.
-q_2,Who wrote 'To Kill a Mockingbird'?,Harper Lee wrote 'To Kill a Mockingbird'.
-q_3,What is the largest planet in our solar system?,Jupiter is the largest planet in our solar system.
-q_4,Define photosynthesis.,Photosynthesis is the process by which green plants use sunlight to synthesize foods.
-q_5,Who painted the Mona Lisa?,Leonardo da Vinci painted the Mona Lisa.
-q_6,What is the speed of light?,"The speed of light is approximately 299,792 kilometers per second."
-q_7,Explain the theory of relativity.,"The theory of relativity, developed by Albert Einstein, explains the relationship between space and time."
-q_8,What is the chemical formula for water?,The chemical formula for water is H2O.
-q_9,Who discovered penicillin?,Alexander Fleming discovered penicillin.
-q_10,What is the square root of 64?,The square root of 64 is 8.

test.py ADDED Viewed

	@@ -0,0 +1,138 @@

+import streamlit as st
+import pandas as pd
+# Sample Data (Replace with your actual data loading)
+data = {
+    'query_v': {
+        'gemini': 'Cheap European city break in February.',
+        'llama': 'Affordable European trip in February.',
+    },
+    'query_p0': {
+        'gemini': 'European city break in February, less crowded destinations.',
+         'llama': 'February European city break, away from the crowds.',
+    },
+    'query_p1': {
+        'gemini': 'Best European cities for intense physical training and recovery with easy access to ice rinks?',
+        'llama': 'Top European cities for intense training and recovery with ice rinks?',
+    },
+}
+# Sample rating data (Replace this with your actual data)
+rating_data = {
+    'gemini': {
+        'query_v': {'relevance': 'Not Relevant', 'clarity': 'Not Clear'},
+        'query_p0': {'relevance': 'Not Relevant', 'clarity': 'Not Clear', 'persona_alignment': 'N/A'},
+        'query_p1': {'relevance': 'N/A', 'clarity': 'N/A', 'persona_alignment': 'N/A'},
+    },
+    'llama': {
+        'query_v': {'relevance': 'Somewhat Relevant', 'clarity': 'Somewhat Clear'},
+        'query_p0': {'relevance': 'Somewhat Relevant', 'clarity': 'Somewhat Clear', 'persona_alignment': 'Partially Aligned'},
+        'query_p1': {'relevance': 'Not Relevant', 'clarity': 'Not Clear', 'persona_alignment': 'Not Aligned'},
+    }
+}
+df = pd.DataFrame.from_dict(data)
+# Function to display query, rating, and controls for one query
+def display_query_section(query_type, query_text_gemini, query_text_llama, relevance_gemini, clarity_gemini, relevance_llama, clarity_llama, persona_alignment_gemini=None, persona_alignment_llama=None):
+    st.subheader(f"{query_type}")
+    col1, col2 = st.columns(2)
+    with col1:
+        st.markdown("Gemini")
+        st.write(query_text_gemini)
+        st.markdown("Relevance")
+        relevance_options = ['N/A', 'Not Relevant', 'Somewhat Relevant', 'Relevant', 'Unclear']
+        selected_relevance_gemini = st.radio("Relevance", options = relevance_options, key=f"relevance_{query_type}_gemini", index=relevance_options.index(relevance_gemini), horizontal=True)
+        st.markdown("Clarity")
+        clarity_options = ['N/A', 'Not Clear', 'Somewhat Clear', 'Very Clear']
+        selected_clarity_gemini = st.radio("Clarity", options = clarity_options, key=f"clarity_{query_type}_gemini", index=clarity_options.index(clarity_gemini), horizontal=True)
+        if persona_alignment_gemini:
+                st.markdown("Persona Alignment")
+                persona_options = ['N/A', 'Not Aligned', 'Partially Aligned', 'Aligned', 'Unclear']
+                selected_persona_alignment_gemini = st.radio("Persona Alignment", options = persona_options, key=f"persona_{query_type}_gemini", index=persona_options.index(persona_alignment_gemini), horizontal=True)
+    with col2:
+            st.markdown("Llama")
+            st.write(query_text_llama)
+            st.markdown("Relevance")
+            relevance_options_llama = ['N/A', 'Not Relevant', 'Somewhat Relevant', 'Relevant', 'Unclear']
+            selected_relevance_llama = st.radio("Relevance", options = relevance_options_llama, key=f"relevance_{query_type}_llama", index=relevance_options_llama.index(relevance_llama), horizontal=True)
+            st.markdown("Clarity")
+            clarity_options_llama = ['N/A', 'Not Clear', 'Somewhat Clear', 'Very Clear']
+            selected_clarity_llama = st.radio("Clarity", options = clarity_options_llama, key=f"clarity_{query_type}_llama", index=clarity_options_llama.index(clarity_llama), horizontal=True)
+            if persona_alignment_llama:
+                  st.markdown("Persona Alignment")
+                  persona_options_llama = ['N/A', 'Not Aligned', 'Partially Aligned', 'Aligned', 'Unclear']
+                  selected_persona_alignment_llama = st.radio("Persona Alignment", options = persona_options_llama, key=f"persona_{query_type}_llama", index=persona_options_llama.index(persona_alignment_llama), horizontal=True)
+# Main Streamlit App
+st.set_page_config(layout="wide")
+# Context Information
+st.title("Question 1 of 5")
+st.subheader("Config ID: c_p_0_pop_low_easy")
+st.markdown("### Context Information")
+with st.expander("Persona", expanded=True):
+    st.write("A top-scoring player in the local league who is also eyeing a professional career in the NHL")
+with st.expander("Filters & Cities", expanded=True):
+     st.write("Filters: {'popularity': 'low', 'month': 'February'}")
+     st.write("Cities: ['Adana', 'Adiyaman', 'Agri', 'Arad', 'Arkhangelsk', 'Bacau', 'Baia Mare', 'Balikesir', 'Brest',\
+'Burgas', 'Canakkale', 'Craiova', 'Debrecen', 'Denizli', 'Diyarbakir', 'Elazig', 'Erzincan', 'Eskisehir',\
+'Gaziantep', 'lasi', 'Ioannina', 'Isparta', 'Jonkoping', 'Kahramanmaras', 'Kars', 'Kayseri', 'Konya', 'Kosice',\
+'Linkoping', 'Malatya', 'Miskolc', 'Mykolaiv', 'Nalchik', 'Nevsehir', 'Nis', 'Orebro', 'Orleans', 'Rivne',\
+'Rzeszow', 'Samsun', 'Sanliurfa', 'Sevilla', 'Siirt', 'Sivas', 'Syktyvkar', 'Targu-Mures', 'Tekirdag',\
+'Thessaloniki', 'Trabzon', 'Uzhhorod', 'Valladolid', 'Van', 'Vasteras', 'Vinnytsia', 'Vitoria-Gasteiz',\
+'Vladikavkaz', 'Zaporizhzhia', 'Zielona Gora', 'Batman', 'Erzurum']")
+# Display Query Sections
+display_query_section(
+    query_type="Query_v",
+    query_text_gemini=df.loc['gemini','query_v'],
+    query_text_llama=df.loc['llama','query_v'],
+    relevance_gemini=rating_data['gemini']['query_v']['relevance'],
+    clarity_gemini=rating_data['gemini']['query_v']['clarity'],
+    relevance_llama=rating_data['llama']['query_v']['relevance'],
+    clarity_llama=rating_data['llama']['query_v']['clarity'],
+)
+display_query_section(
+    query_type="Query_p0",
+    query_text_gemini=df.loc['gemini','query_p0'],
+    query_text_llama=df.loc['llama','query_p0'],
+    relevance_gemini=rating_data['gemini']['query_p0']['relevance'],
+    clarity_gemini=rating_data['gemini']['query_p0']['clarity'],
+     persona_alignment_gemini=rating_data['gemini']['query_p0']['persona_alignment'],
+    relevance_llama=rating_data['llama']['query_p0']['relevance'],
+    clarity_llama=rating_data['llama']['query_p0']['clarity'],
+    persona_alignment_llama=rating_data['llama']['query_p0']['persona_alignment'],
+)
+display_query_section(
+    query_type="Query_p1",
+    query_text_gemini=df.loc['gemini','query_p1'],
+     query_text_llama=df.loc['llama','query_p1'],
+    relevance_gemini=rating_data['gemini']['query_p1']['relevance'],
+    clarity_gemini=rating_data['gemini']['query_p1']['clarity'],
+    persona_alignment_gemini=rating_data['gemini']['query_p1']['persona_alignment'],
+    relevance_llama=rating_data['llama']['query_p1']['relevance'],
+    clarity_llama=rating_data['llama']['query_p1']['clarity'],
+    persona_alignment_llama=rating_data['llama']['query_p1']['persona_alignment'],
+)
+# Additional Comments
+st.markdown("Additional Comments (Optional):")
+st.text_area("", key="additional_comments")
+# Navigation Buttons
+col1, col2, col3 = st.columns([1,1,1])
+with col1:
+    st.button("Back")
+with col2:
+     st.button("Next")
+with col3:
+    st.button("Exit & Resume Later")
+# Bottom message
+st.markdown("Please provide a rating before proceeding.")

utils/loaders.py CHANGED Viewed

@@ -12,8 +12,7 @@ DATA_FILES = os.getenv("GEMINI_DATA_FILES")
 def load_data():
     try:
-        #TODO: change this to load the data from the database (buggy for debugging)
-        data = pd.read_csv("data/gemini_results_subset.csv")[:5]
         return data
     except Exception as e:

 def load_data():
     try:
+        data = pd.read_csv("data/user-evaluation/merged.csv")[:5]
         return data
     except Exception as e:

utils/notebooks/Data Merging.ipynb ADDED Viewed

	@@ -0,0 +1,858 @@

+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "a16bb8a1",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import pandas as pd"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "4fc12e60",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(200, 9)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>config_id</th>\n",
+       "      <th>persona_id</th>\n",
+       "      <th>persona</th>\n",
+       "      <th>filters</th>\n",
+       "      <th>context</th>\n",
+       "      <th>city</th>\n",
+       "      <th>llama_query_v</th>\n",
+       "      <th>llama_query_p0</th>\n",
+       "      <th>llama_query_p1</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>c_p_0_pop_low_easy</td>\n",
+       "      <td>p_0</td>\n",
+       "      <td>A top-scoring player in the local league who i...</td>\n",
+       "      <td>{'popularity': 'low', 'month': 'February'}</td>\n",
+       "      <td>Adana has low popularity. Adana has low season...</td>\n",
+       "      <td>['Adana', 'Adiyaman', 'Agri', 'Arad', 'Arkhang...</td>\n",
+       "      <td>\"Less crowded European cities to visit in Febr...</td>\n",
+       "      <td>\"European cities with ice hockey facilities, l...</td>\n",
+       "      <td>Based on the user's profile as a top-scoring p...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>c_p_1_pop_medium_medium</td>\n",
+       "      <td>p_1</td>\n",
+       "      <td>A former DJ at WSUM who is now working as a mu...</td>\n",
+       "      <td>{'popularity': 'medium', 'budget': 'medium', '...</td>\n",
+       "      <td>Coimbra has medium popularity and medium budge...</td>\n",
+       "      <td>['Coimbra', 'Brno', 'Braga']</td>\n",
+       "      <td>'medium budget European city breaks with parks...</td>\n",
+       "      <td>\"Medium budget European cities with parks and ...</td>\n",
+       "      <td>Based on the user's background as a former DJ ...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>c_p_2_pop_high_hard</td>\n",
+       "      <td>p_2</td>\n",
+       "      <td>A fellow agent-turned-author who shares the sa...</td>\n",
+       "      <td>{'popularity': 'high', 'budget': 'low', 'inter...</td>\n",
+       "      <td>Zagreb has high popularity and low budget. Zag...</td>\n",
+       "      <td>['Zagreb', 'Volgograd', 'Tirana', 'Tbilisi', '...</td>\n",
+       "      <td>\"Looking for a popular and affordable European...</td>\n",
+       "      <td>\"Low-budget European cities with museums and n...</td>\n",
+       "      <td>Based on the provided information, I'm going t...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>c_p_3_pop_low_sustainable</td>\n",
+       "      <td>p_3</td>\n",
+       "      <td>a film critic who dislikes storylines involvin...</td>\n",
+       "      <td>{'popularity': 'low', 'interests': 'Outdoors &amp;...</td>\n",
+       "      <td>Van has low popularity. Van has low season in ...</td>\n",
+       "      <td>['Van', 'Uzhhorod', 'Trabzon', 'Thessaloniki',...</td>\n",
+       "      <td>\"European cities with low popularity, monaster...</td>\n",
+       "      <td>\"off the beaten path European city breaks in l...</td>\n",
+       "      <td>Based on the given information, I'll create a ...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>c_p_4_pop_medium_easy</td>\n",
+       "      <td>p_4</td>\n",
+       "      <td>A biology major conducting research on equine ...</td>\n",
+       "      <td>{'popularity': 'medium', 'budget': 'high'}</td>\n",
+       "      <td>Aalborg has medium popularity and high budget....</td>\n",
+       "      <td>['Aalborg', 'Astrakhan', 'Bari', 'Bremen', 'Ch...</td>\n",
+       "      <td>\"European cities for a luxurious trip.\"</td>\n",
+       "      <td>\"European cities with horse riding trails and ...</td>\n",
+       "      <td>Based on the user's background and interests, ...</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                   config_id persona_id  \\\n",
+       "0         c_p_0_pop_low_easy        p_0   \n",
+       "1    c_p_1_pop_medium_medium        p_1   \n",
+       "2        c_p_2_pop_high_hard        p_2   \n",
+       "3  c_p_3_pop_low_sustainable        p_3   \n",
+       "4      c_p_4_pop_medium_easy        p_4   \n",
+       "\n",
+       "                                             persona  \\\n",
+       "0  A top-scoring player in the local league who i...   \n",
+       "1  A former DJ at WSUM who is now working as a mu...   \n",
+       "2  A fellow agent-turned-author who shares the sa...   \n",
+       "3  a film critic who dislikes storylines involvin...   \n",
+       "4  A biology major conducting research on equine ...   \n",
+       "\n",
+       "                                             filters  \\\n",
+       "0         {'popularity': 'low', 'month': 'February'}   \n",
+       "1  {'popularity': 'medium', 'budget': 'medium', '...   \n",
+       "2  {'popularity': 'high', 'budget': 'low', 'inter...   \n",
+       "3  {'popularity': 'low', 'interests': 'Outdoors &...   \n",
+       "4         {'popularity': 'medium', 'budget': 'high'}   \n",
+       "\n",
+       "                                             context  \\\n",
+       "0  Adana has low popularity. Adana has low season...   \n",
+       "1  Coimbra has medium popularity and medium budge...   \n",
+       "2  Zagreb has high popularity and low budget. Zag...   \n",
+       "3  Van has low popularity. Van has low season in ...   \n",
+       "4  Aalborg has medium popularity and high budget....   \n",
+       "\n",
+       "                                                city  \\\n",
+       "0  ['Adana', 'Adiyaman', 'Agri', 'Arad', 'Arkhang...   \n",
+       "1                       ['Coimbra', 'Brno', 'Braga']   \n",
+       "2  ['Zagreb', 'Volgograd', 'Tirana', 'Tbilisi', '...   \n",
+       "3  ['Van', 'Uzhhorod', 'Trabzon', 'Thessaloniki',...   \n",
+       "4  ['Aalborg', 'Astrakhan', 'Bari', 'Bremen', 'Ch...   \n",
+       "\n",
+       "                                       llama_query_v  \\\n",
+       "0  \"Less crowded European cities to visit in Febr...   \n",
+       "1  'medium budget European city breaks with parks...   \n",
+       "2  \"Looking for a popular and affordable European...   \n",
+       "3  \"European cities with low popularity, monaster...   \n",
+       "4            \"European cities for a luxurious trip.\"   \n",
+       "\n",
+       "                                      llama_query_p0  \\\n",
+       "0  \"European cities with ice hockey facilities, l...   \n",
+       "1  \"Medium budget European cities with parks and ...   \n",
+       "2  \"Low-budget European cities with museums and n...   \n",
+       "3  \"off the beaten path European city breaks in l...   \n",
+       "4  \"European cities with horse riding trails and ...   \n",
+       "\n",
+       "                                      llama_query_p1  \n",
+       "0  Based on the user's profile as a top-scoring p...  \n",
+       "1  Based on the user's background as a former DJ ...  \n",
+       "2  Based on the provided information, I'm going t...  \n",
+       "3  Based on the given information, I'll create a ...  \n",
+       "4  Based on the user's background and interests, ...  "
+      ]
+     },
+     "execution_count": 6,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "llama = pd.read_csv(\"../../data/llama_results_subset.csv\")\n",
+    "# llama[\"model\"] = \"llama-3.2-90b\"\n",
+    "\n",
+    "llama.rename(columns={'query_v': \"llama_query_v\", 'query_p0': \"llama_query_p0\", \"query_p1\": \"llama_query_p1\"}, inplace = True)\n",
+    "\n",
+    "print(llama.shape)\n",
+    "llama.head()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "id": "a651f27b",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(200, 9)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>config_id</th>\n",
+       "      <th>persona_id</th>\n",
+       "      <th>persona</th>\n",
+       "      <th>filters</th>\n",
+       "      <th>context</th>\n",
+       "      <th>city</th>\n",
+       "      <th>gemini_query_v</th>\n",
+       "      <th>gemini_query_p0</th>\n",
+       "      <th>gemini_query_p1</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>c_p_0_pop_low_easy</td>\n",
+       "      <td>p_0</td>\n",
+       "      <td>A top-scoring player in the local league who i...</td>\n",
+       "      <td>{'popularity': 'low', 'month': 'February'}</td>\n",
+       "      <td>Adana has low popularity. Adana has low season...</td>\n",
+       "      <td>['Adana', 'Adiyaman', 'Agri', 'Arad', 'Arkhang...</td>\n",
+       "      <td>Cheap European city break in February.\\n</td>\n",
+       "      <td>European city break in February, less crowded ...</td>\n",
+       "      <td>Best European cities for intense physical trai...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>c_p_1_pop_medium_medium</td>\n",
+       "      <td>p_1</td>\n",
+       "      <td>A former DJ at WSUM who is now working as a mu...</td>\n",
+       "      <td>{'popularity': 'medium', 'budget': 'medium', '...</td>\n",
+       "      <td>Coimbra has medium popularity and medium budge...</td>\n",
+       "      <td>['Coimbra', 'Brno', 'Braga']</td>\n",
+       "      <td>Medium budget European city break with parks a...</td>\n",
+       "      <td>European city break, medium budget, good parks...</td>\n",
+       "      <td>Best European cities for live music, especiall...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>c_p_2_pop_high_hard</td>\n",
+       "      <td>p_2</td>\n",
+       "      <td>A fellow agent-turned-author who shares the sa...</td>\n",
+       "      <td>{'popularity': 'high', 'budget': 'low', 'inter...</td>\n",
+       "      <td>Zagreb has high popularity and low budget. Zag...</td>\n",
+       "      <td>['Zagreb', 'Volgograd', 'Tirana', 'Tbilisi', '...</td>\n",
+       "      <td>Cheap January city break in Europe with museum...</td>\n",
+       "      <td>European city break in January. Budget friendl...</td>\n",
+       "      <td>Where can I find inspiring European cities wit...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>c_p_3_pop_low_sustainable</td>\n",
+       "      <td>p_3</td>\n",
+       "      <td>a film critic who dislikes storylines involvin...</td>\n",
+       "      <td>{'popularity': 'low', 'interests': 'Outdoors &amp;...</td>\n",
+       "      <td>Van has low popularity. Van has low season in ...</td>\n",
+       "      <td>['Van', 'Uzhhorod', 'Trabzon', 'Thessaloniki',...</td>\n",
+       "      <td>Cheap European city break in January with inte...</td>\n",
+       "      <td>European city break in January. Low-budget des...</td>\n",
+       "      <td>Best European cities for unique, artistic expe...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>c_p_4_pop_medium_easy</td>\n",
+       "      <td>p_4</td>\n",
+       "      <td>A biology major conducting research on equine ...</td>\n",
+       "      <td>{'popularity': 'medium', 'budget': 'high'}</td>\n",
+       "      <td>Aalborg has medium popularity and high budget....</td>\n",
+       "      <td>['Aalborg', 'Astrakhan', 'Bari', 'Bremen', 'Ch...</td>\n",
+       "      <td>Suggest some moderately popular European citie...</td>\n",
+       "      <td>High-budget European city with equestrian attr...</td>\n",
+       "      <td>European cities with renowned veterinary or ag...</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                   config_id persona_id  \\\n",
+       "0         c_p_0_pop_low_easy        p_0   \n",
+       "1    c_p_1_pop_medium_medium        p_1   \n",
+       "2        c_p_2_pop_high_hard        p_2   \n",
+       "3  c_p_3_pop_low_sustainable        p_3   \n",
+       "4      c_p_4_pop_medium_easy        p_4   \n",
+       "\n",
+       "                                             persona  \\\n",
+       "0  A top-scoring player in the local league who i...   \n",
+       "1  A former DJ at WSUM who is now working as a mu...   \n",
+       "2  A fellow agent-turned-author who shares the sa...   \n",
+       "3  a film critic who dislikes storylines involvin...   \n",
+       "4  A biology major conducting research on equine ...   \n",
+       "\n",
+       "                                             filters  \\\n",
+       "0         {'popularity': 'low', 'month': 'February'}   \n",
+       "1  {'popularity': 'medium', 'budget': 'medium', '...   \n",
+       "2  {'popularity': 'high', 'budget': 'low', 'inter...   \n",
+       "3  {'popularity': 'low', 'interests': 'Outdoors &...   \n",
+       "4         {'popularity': 'medium', 'budget': 'high'}   \n",
+       "\n",
+       "                                             context  \\\n",
+       "0  Adana has low popularity. Adana has low season...   \n",
+       "1  Coimbra has medium popularity and medium budge...   \n",
+       "2  Zagreb has high popularity and low budget. Zag...   \n",
+       "3  Van has low popularity. Van has low season in ...   \n",
+       "4  Aalborg has medium popularity and high budget....   \n",
+       "\n",
+       "                                                city  \\\n",
+       "0  ['Adana', 'Adiyaman', 'Agri', 'Arad', 'Arkhang...   \n",
+       "1                       ['Coimbra', 'Brno', 'Braga']   \n",
+       "2  ['Zagreb', 'Volgograd', 'Tirana', 'Tbilisi', '...   \n",
+       "3  ['Van', 'Uzhhorod', 'Trabzon', 'Thessaloniki',...   \n",
+       "4  ['Aalborg', 'Astrakhan', 'Bari', 'Bremen', 'Ch...   \n",
+       "\n",
+       "                                      gemini_query_v  \\\n",
+       "0           Cheap European city break in February.\\n   \n",
+       "1  Medium budget European city break with parks a...   \n",
+       "2  Cheap January city break in Europe with museum...   \n",
+       "3  Cheap European city break in January with inte...   \n",
+       "4  Suggest some moderately popular European citie...   \n",
+       "\n",
+       "                                     gemini_query_p0  \\\n",
+       "0  European city break in February, less crowded ...   \n",
+       "1  European city break, medium budget, good parks...   \n",
+       "2  European city break in January. Budget friendl...   \n",
+       "3  European city break in January. Low-budget des...   \n",
+       "4  High-budget European city with equestrian attr...   \n",
+       "\n",
+       "                                     gemini_query_p1  \n",
+       "0  Best European cities for intense physical trai...  \n",
+       "1  Best European cities for live music, especiall...  \n",
+       "2  Where can I find inspiring European cities wit...  \n",
+       "3  Best European cities for unique, artistic expe...  \n",
+       "4  European cities with renowned veterinary or ag...  "
+      ]
+     },
+     "execution_count": 7,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "gemini = pd.read_csv(\"../../data/gemini_results_subset.csv\")\n",
+    "# gemini[\"model\"] = \"gemini-1.5-pro-002\"\n",
+    "gemini.rename(columns={'query_v': \"gemini_query_v\", 'query_p0': \"gemini_query_p0\", \"query_p1\": \"gemini_query_p1\"}, inplace = True)\n",
+    "\n",
+    "print(gemini.shape)\n",
+    "gemini.head()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "id": "dfd8102c",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "6\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "['filters', 'city', 'context', 'config_id', 'persona', 'persona_id']"
+      ]
+     },
+     "execution_count": 8,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "common_cols = list(set(list(gemini)).intersection(set(list(llama))))\n",
+    "print(len(common_cols))\n",
+    "common_cols"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "id": "32344df6",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(200, 12)\n"
+     ]
+    },
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>config_id</th>\n",
+       "      <th>persona_id</th>\n",
+       "      <th>persona</th>\n",
+       "      <th>filters</th>\n",
+       "      <th>context</th>\n",
+       "      <th>city</th>\n",
+       "      <th>gemini_query_v</th>\n",
+       "      <th>gemini_query_p0</th>\n",
+       "      <th>gemini_query_p1</th>\n",
+       "      <th>llama_query_v</th>\n",
+       "      <th>llama_query_p0</th>\n",
+       "      <th>llama_query_p1</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>c_p_0_pop_low_easy</td>\n",
+       "      <td>p_0</td>\n",
+       "      <td>A top-scoring player in the local league who i...</td>\n",
+       "      <td>{'popularity': 'low', 'month': 'February'}</td>\n",
+       "      <td>Adana has low popularity. Adana has low season...</td>\n",
+       "      <td>['Adana', 'Adiyaman', 'Agri', 'Arad', 'Arkhang...</td>\n",
+       "      <td>Cheap European city break in February.\\n</td>\n",
+       "      <td>European city break in February, less crowded ...</td>\n",
+       "      <td>Best European cities for intense physical trai...</td>\n",
+       "      <td>\"Less crowded European cities to visit in Febr...</td>\n",
+       "      <td>\"European cities with ice hockey facilities, l...</td>\n",
+       "      <td>Based on the user's profile as a top-scoring p...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>c_p_1_pop_medium_medium</td>\n",
+       "      <td>p_1</td>\n",
+       "      <td>A former DJ at WSUM who is now working as a mu...</td>\n",
+       "      <td>{'popularity': 'medium', 'budget': 'medium', '...</td>\n",
+       "      <td>Coimbra has medium popularity and medium budge...</td>\n",
+       "      <td>['Coimbra', 'Brno', 'Braga']</td>\n",
+       "      <td>Medium budget European city break with parks a...</td>\n",
+       "      <td>European city break, medium budget, good parks...</td>\n",
+       "      <td>Best European cities for live music, especiall...</td>\n",
+       "      <td>'medium budget European city breaks with parks...</td>\n",
+       "      <td>\"Medium budget European cities with parks and ...</td>\n",
+       "      <td>Based on the user's background as a former DJ ...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>c_p_2_pop_high_hard</td>\n",
+       "      <td>p_2</td>\n",
+       "      <td>A fellow agent-turned-author who shares the sa...</td>\n",
+       "      <td>{'popularity': 'high', 'budget': 'low', 'inter...</td>\n",
+       "      <td>Zagreb has high popularity and low budget. Zag...</td>\n",
+       "      <td>['Zagreb', 'Volgograd', 'Tirana', 'Tbilisi', '...</td>\n",
+       "      <td>Cheap January city break in Europe with museum...</td>\n",
+       "      <td>European city break in January. Budget friendl...</td>\n",
+       "      <td>Where can I find inspiring European cities wit...</td>\n",
+       "      <td>\"Looking for a popular and affordable European...</td>\n",
+       "      <td>\"Low-budget European cities with museums and n...</td>\n",
+       "      <td>Based on the provided information, I'm going t...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>c_p_3_pop_low_sustainable</td>\n",
+       "      <td>p_3</td>\n",
+       "      <td>a film critic who dislikes storylines involvin...</td>\n",
+       "      <td>{'popularity': 'low', 'interests': 'Outdoors &amp;...</td>\n",
+       "      <td>Van has low popularity. Van has low season in ...</td>\n",
+       "      <td>['Van', 'Uzhhorod', 'Trabzon', 'Thessaloniki',...</td>\n",
+       "      <td>Cheap European city break in January with inte...</td>\n",
+       "      <td>European city break in January. Low-budget des...</td>\n",
+       "      <td>Best European cities for unique, artistic expe...</td>\n",
+       "      <td>\"European cities with low popularity, monaster...</td>\n",
+       "      <td>\"off the beaten path European city breaks in l...</td>\n",
+       "      <td>Based on the given information, I'll create a ...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>c_p_4_pop_medium_easy</td>\n",
+       "      <td>p_4</td>\n",
+       "      <td>A biology major conducting research on equine ...</td>\n",
+       "      <td>{'popularity': 'medium', 'budget': 'high'}</td>\n",
+       "      <td>Aalborg has medium popularity and high budget....</td>\n",
+       "      <td>['Aalborg', 'Astrakhan', 'Bari', 'Bremen', 'Ch...</td>\n",
+       "      <td>Suggest some moderately popular European citie...</td>\n",
+       "      <td>High-budget European city with equestrian attr...</td>\n",
+       "      <td>European cities with renowned veterinary or ag...</td>\n",
+       "      <td>\"European cities for a luxurious trip.\"</td>\n",
+       "      <td>\"European cities with horse riding trails and ...</td>\n",
+       "      <td>Based on the user's background and interests, ...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>...</th>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>195</th>\n",
+       "      <td>c_p_8_pop_medium_easy</td>\n",
+       "      <td>p_8</td>\n",
+       "      <td>A junior Flash developer seeking guidance on c...</td>\n",
+       "      <td>{'popularity': 'medium', 'interests': 'Outdoor...</td>\n",
+       "      <td>Zaragoza has medium popularity. In Zaragoza yo...</td>\n",
+       "      <td>['Zaragoza', 'Varna', 'Turku', 'Tampere', 'Szc...</td>\n",
+       "      <td>Good places to swim outdoors in Europe\\n</td>\n",
+       "      <td>Good places for a Flash developer to visit in ...</td>\n",
+       "      <td>Best European cities for tech meetups &amp; cowork...</td>\n",
+       "      <td>\"European cities with medium popularity for ou...</td>\n",
+       "      <td>A junior Flash developer seeking guidance on c...</td>\n",
+       "      <td>Which European cities offer a mix of cultural ...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>196</th>\n",
+       "      <td>c_p_9_pop_high_medium</td>\n",
+       "      <td>p_9</td>\n",
+       "      <td>An avid gamer who has played Sins of a Solar E...</td>\n",
+       "      <td>{'popularity': 'high', 'month': 'April', 'budg...</td>\n",
+       "      <td>Sarajevo has high popularity and medium budget...</td>\n",
+       "      <td>['Sarajevo', 'Tallinn', 'Vilnius', 'Belgrade',...</td>\n",
+       "      <td>Medium budget European city break in April wit...</td>\n",
+       "      <td>Budget-friendly European city break in April w...</td>\n",
+       "      <td>European cities with a grand, futuristic feel ...</td>\n",
+       "      <td>'medium budget trip in April to a popular Euro...</td>\n",
+       "      <td>\"Medium budget trip to a popular European city...</td>\n",
+       "      <td>Based on the user's interest in Sins of a Sola...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>197</th>\n",
+       "      <td>c_p_10_pop_low_hard</td>\n",
+       "      <td>p_10</td>\n",
+       "      <td>An atheist, philosophy lecturer who encourages...</td>\n",
+       "      <td>{'popularity': 'low', 'interests': 'Outdoors &amp;...</td>\n",
+       "      <td>Malatya has low popularity and high budget. Ma...</td>\n",
+       "      <td>['Malatya', 'Ioannina']</td>\n",
+       "      <td>High-budget European city trip in February wit...</td>\n",
+       "      <td>European city break in February. Low season &amp; ...</td>\n",
+       "      <td>Where can I find European cities rich in histo...</td>\n",
+       "      <td>\"Less crowded European destinations with water...</td>\n",
+       "      <td>\"Less crowded European destinations for a pric...</td>\n",
+       "      <td>Based on the provided information, I would gue...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>198</th>\n",
+       "      <td>c_p_11_pop_medium_sustainable</td>\n",
+       "      <td>p_11</td>\n",
+       "      <td>A young apprentice fascinated by the technolog...</td>\n",
+       "      <td>{'popularity': 'medium', 'budget': 'low', 'mon...</td>\n",
+       "      <td>Chelyabinsk has medium popularity , low budget...</td>\n",
+       "      <td>['Chelyabinsk', 'Kirov', 'Podgorica', 'Rijeka'...</td>\n",
+       "      <td>Suggest a low-budget, walkable European city b...</td>\n",
+       "      <td>Budget-friendly European city break in April, ...</td>\n",
+       "      <td>Which European cities offer glimpses into the ...</td>\n",
+       "      <td>\"European cities with great walkability and lo...</td>\n",
+       "      <td>\"European cities with industrial heritage site...</td>\n",
+       "      <td>Based on the user's interest in technological ...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>199</th>\n",
+       "      <td>c_p_12_pop_high_easy</td>\n",
+       "      <td>p_12</td>\n",
+       "      <td>A high school guidance counselor in Winnebago ...</td>\n",
+       "      <td>{'popularity': 'high', 'budget': 'medium'}</td>\n",
+       "      <td>Belgrade has high popularity and medium budget...</td>\n",
+       "      <td>['Belgrade', 'Bratislava', 'Budapest', 'Nicosi...</td>\n",
+       "      <td>Popular and affordable European city break des...</td>\n",
+       "      <td>Affordable, popular European capitals for a we...</td>\n",
+       "      <td>Affordable, safe European cities with historic...</td>\n",
+       "      <td>'medium budget european city breaks in popular...</td>\n",
+       "      <td>\"Medium budget city breaks in Europe for a sch...</td>\n",
+       "      <td>Based on the information provided, I'll make a...</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "<p>200 rows × 12 columns</p>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "                         config_id persona_id  \\\n",
+       "0               c_p_0_pop_low_easy        p_0   \n",
+       "1          c_p_1_pop_medium_medium        p_1   \n",
+       "2              c_p_2_pop_high_hard        p_2   \n",
+       "3        c_p_3_pop_low_sustainable        p_3   \n",
+       "4            c_p_4_pop_medium_easy        p_4   \n",
+       "..                             ...        ...   \n",
+       "195          c_p_8_pop_medium_easy        p_8   \n",
+       "196          c_p_9_pop_high_medium        p_9   \n",
+       "197            c_p_10_pop_low_hard       p_10   \n",
+       "198  c_p_11_pop_medium_sustainable       p_11   \n",
+       "199           c_p_12_pop_high_easy       p_12   \n",
+       "\n",
+       "                                               persona  \\\n",
+       "0    A top-scoring player in the local league who i...   \n",
+       "1    A former DJ at WSUM who is now working as a mu...   \n",
+       "2    A fellow agent-turned-author who shares the sa...   \n",
+       "3    a film critic who dislikes storylines involvin...   \n",
+       "4    A biology major conducting research on equine ...   \n",
+       "..                                                 ...   \n",
+       "195  A junior Flash developer seeking guidance on c...   \n",
+       "196  An avid gamer who has played Sins of a Solar E...   \n",
+       "197  An atheist, philosophy lecturer who encourages...   \n",
+       "198  A young apprentice fascinated by the technolog...   \n",
+       "199  A high school guidance counselor in Winnebago ...   \n",
+       "\n",
+       "                                               filters  \\\n",
+       "0           {'popularity': 'low', 'month': 'February'}   \n",
+       "1    {'popularity': 'medium', 'budget': 'medium', '...   \n",
+       "2    {'popularity': 'high', 'budget': 'low', 'inter...   \n",
+       "3    {'popularity': 'low', 'interests': 'Outdoors &...   \n",
+       "4           {'popularity': 'medium', 'budget': 'high'}   \n",
+       "..                                                 ...   \n",
+       "195  {'popularity': 'medium', 'interests': 'Outdoor...   \n",
+       "196  {'popularity': 'high', 'month': 'April', 'budg...   \n",
+       "197  {'popularity': 'low', 'interests': 'Outdoors &...   \n",
+       "198  {'popularity': 'medium', 'budget': 'low', 'mon...   \n",
+       "199         {'popularity': 'high', 'budget': 'medium'}   \n",
+       "\n",
+       "                                               context  \\\n",
+       "0    Adana has low popularity. Adana has low season...   \n",
+       "1    Coimbra has medium popularity and medium budge...   \n",
+       "2    Zagreb has high popularity and low budget. Zag...   \n",
+       "3    Van has low popularity. Van has low season in ...   \n",
+       "4    Aalborg has medium popularity and high budget....   \n",
+       "..                                                 ...   \n",
+       "195  Zaragoza has medium popularity. In Zaragoza yo...   \n",
+       "196  Sarajevo has high popularity and medium budget...   \n",
+       "197  Malatya has low popularity and high budget. Ma...   \n",
+       "198  Chelyabinsk has medium popularity , low budget...   \n",
+       "199  Belgrade has high popularity and medium budget...   \n",
+       "\n",
+       "                                                  city  \\\n",
+       "0    ['Adana', 'Adiyaman', 'Agri', 'Arad', 'Arkhang...   \n",
+       "1                         ['Coimbra', 'Brno', 'Braga']   \n",
+       "2    ['Zagreb', 'Volgograd', 'Tirana', 'Tbilisi', '...   \n",
+       "3    ['Van', 'Uzhhorod', 'Trabzon', 'Thessaloniki',...   \n",
+       "4    ['Aalborg', 'Astrakhan', 'Bari', 'Bremen', 'Ch...   \n",
+       "..                                                 ...   \n",
+       "195  ['Zaragoza', 'Varna', 'Turku', 'Tampere', 'Szc...   \n",
+       "196  ['Sarajevo', 'Tallinn', 'Vilnius', 'Belgrade',...   \n",
+       "197                            ['Malatya', 'Ioannina']   \n",
+       "198  ['Chelyabinsk', 'Kirov', 'Podgorica', 'Rijeka'...   \n",
+       "199  ['Belgrade', 'Bratislava', 'Budapest', 'Nicosi...   \n",
+       "\n",
+       "                                        gemini_query_v  \\\n",
+       "0             Cheap European city break in February.\\n   \n",
+       "1    Medium budget European city break with parks a...   \n",
+       "2    Cheap January city break in Europe with museum...   \n",
+       "3    Cheap European city break in January with inte...   \n",
+       "4    Suggest some moderately popular European citie...   \n",
+       "..                                                 ...   \n",
+       "195           Good places to swim outdoors in Europe\\n   \n",
+       "196  Medium budget European city break in April wit...   \n",
+       "197  High-budget European city trip in February wit...   \n",
+       "198  Suggest a low-budget, walkable European city b...   \n",
+       "199  Popular and affordable European city break des...   \n",
+       "\n",
+       "                                       gemini_query_p0  \\\n",
+       "0    European city break in February, less crowded ...   \n",
+       "1    European city break, medium budget, good parks...   \n",
+       "2    European city break in January. Budget friendl...   \n",
+       "3    European city break in January. Low-budget des...   \n",
+       "4    High-budget European city with equestrian attr...   \n",
+       "..                                                 ...   \n",
+       "195  Good places for a Flash developer to visit in ...   \n",
+       "196  Budget-friendly European city break in April w...   \n",
+       "197  European city break in February. Low season & ...   \n",
+       "198  Budget-friendly European city break in April, ...   \n",
+       "199  Affordable, popular European capitals for a we...   \n",
+       "\n",
+       "                                       gemini_query_p1  \\\n",
+       "0    Best European cities for intense physical trai...   \n",
+       "1    Best European cities for live music, especiall...   \n",
+       "2    Where can I find inspiring European cities wit...   \n",
+       "3    Best European cities for unique, artistic expe...   \n",
+       "4    European cities with renowned veterinary or ag...   \n",
+       "..                                                 ...   \n",
+       "195  Best European cities for tech meetups & cowork...   \n",
+       "196  European cities with a grand, futuristic feel ...   \n",
+       "197  Where can I find European cities rich in histo...   \n",
+       "198  Which European cities offer glimpses into the ...   \n",
+       "199  Affordable, safe European cities with historic...   \n",
+       "\n",
+       "                                         llama_query_v  \\\n",
+       "0    \"Less crowded European cities to visit in Febr...   \n",
+       "1    'medium budget European city breaks with parks...   \n",
+       "2    \"Looking for a popular and affordable European...   \n",
+       "3    \"European cities with low popularity, monaster...   \n",
+       "4              \"European cities for a luxurious trip.\"   \n",
+       "..                                                 ...   \n",
+       "195  \"European cities with medium popularity for ou...   \n",
+       "196  'medium budget trip in April to a popular Euro...   \n",
+       "197  \"Less crowded European destinations with water...   \n",
+       "198  \"European cities with great walkability and lo...   \n",
+       "199  'medium budget european city breaks in popular...   \n",
+       "\n",
+       "                                        llama_query_p0  \\\n",
+       "0    \"European cities with ice hockey facilities, l...   \n",
+       "1    \"Medium budget European cities with parks and ...   \n",
+       "2    \"Low-budget European cities with museums and n...   \n",
+       "3    \"off the beaten path European city breaks in l...   \n",
+       "4    \"European cities with horse riding trails and ...   \n",
+       "..                                                 ...   \n",
+       "195  A junior Flash developer seeking guidance on c...   \n",
+       "196  \"Medium budget trip to a popular European city...   \n",
+       "197  \"Less crowded European destinations for a pric...   \n",
+       "198  \"European cities with industrial heritage site...   \n",
+       "199  \"Medium budget city breaks in Europe for a sch...   \n",
+       "\n",
+       "                                        llama_query_p1  \n",
+       "0    Based on the user's profile as a top-scoring p...  \n",
+       "1    Based on the user's background as a former DJ ...  \n",
+       "2    Based on the provided information, I'm going t...  \n",
+       "3    Based on the given information, I'll create a ...  \n",
+       "4    Based on the user's background and interests, ...  \n",
+       "..                                                 ...  \n",
+       "195  Which European cities offer a mix of cultural ...  \n",
+       "196  Based on the user's interest in Sins of a Sola...  \n",
+       "197  Based on the provided information, I would gue...  \n",
+       "198  Based on the user's interest in technological ...  \n",
+       "199  Based on the information provided, I'll make a...  \n",
+       "\n",
+       "[200 rows x 12 columns]"
+      ]
+     },
+     "execution_count": 9,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "merged = pd.merge(gemini, llama, on=common_cols, how=\"right\")\n",
+    "print(merged.shape)\n",
+    "merged"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "id": "ed6dca09",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "config_id          0\n",
+       "persona_id         0\n",
+       "persona            0\n",
+       "filters            0\n",
+       "context            0\n",
+       "city               0\n",
+       "gemini_query_v     0\n",
+       "gemini_query_p0    0\n",
+       "gemini_query_p1    0\n",
+       "llama_query_v      0\n",
+       "llama_query_p0     0\n",
+       "llama_query_p1     0\n",
+       "dtype: int64"
+      ]
+     },
+     "execution_count": 11,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "merged.isna().sum()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
+   "id": "9693f553",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "merged.to_csv(\"../../data/user-evaluation/merged.csv\", index=False)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "93dba3ec",
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": ".crs-venv",
+   "language": "python",
+   "name": ".crs-venv"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.10.15"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}

views/questions_screen.py CHANGED Viewed

@@ -4,7 +4,7 @@ from datetime import datetime
 import os
 from dotenv import load_dotenv
 from views.nav_buttons import navigation_buttons
 load_dotenv()
@@ -80,11 +80,11 @@ def questions_screen(data):
             st.text_area("", config['context'], height=300, disabled=False)
         # Render queries and collect ratings
-        query_v_ratings = render_query_ratings("Query_v", config, "query_v", current_index)
         query_p0_ratings = render_query_ratings("Query_p0",
-                                                config, "query_p0", current_index, has_persona_alignment=True)
         query_p1_ratings = render_query_ratings("Query_p1",
-                                                config, "query_p1",
                                                 current_index, has_persona_alignment=True)
         # Additional comments

 import os
 from dotenv import load_dotenv
 from views.nav_buttons import navigation_buttons
+st.set_page_config(layout="wide")
 load_dotenv()
             st.text_area("", config['context'], height=300, disabled=False)
         # Render queries and collect ratings
+        query_v_ratings = render_query_ratings("Query_v", config, "gemini_query_v", current_index)
         query_p0_ratings = render_query_ratings("Query_p0",
+                                                config, "gemini_query_p0", current_index, has_persona_alignment=True)
         query_p1_ratings = render_query_ratings("Query_p1",
+                                                config, "gemini_query_p1",
                                                 current_index, has_persona_alignment=True)
         # Additional comments