leaderboard-hackaton-2025

Running

App Files Community

ouhenio committed 4 days ago

Commit

2b70f36

verified ·

1 Parent(s): 1596d90

Update app.py

Browse files

Files changed (1) hide show

app.py +62 -3

app.py CHANGED Viewed

@@ -221,6 +221,59 @@ def get_estereotipos_data(username_mapping):
     return result
 @lru_cache(maxsize=32)
 def get_user_contributions_cached(cache_buster: int):
     """Return consolidate_all_data()'s result, memoised per cache_buster value."""
     # cache_buster is never read here: it only forms the lru_cache key, so a
     # value not seen before forces a fresh consolidate_all_data() call.
     consolidated = consolidate_all_data()
     return consolidated
@@ -231,8 +284,9 @@ def consolidate_all_data():
     blend_es_data, username_mapping = get_blend_es_data()
     include_data = get_include_data(username_mapping)
     estereotipos_data = get_estereotipos_data(username_mapping)
-    all_user_ids = set(blend_es_data.keys()) | set(include_data.keys()) | set(estereotipos_data.keys())
     rows = []
     for user_id in all_user_ids:
@@ -245,6 +299,7 @@ def consolidate_all_data():
         include_value = include_data.get(user_id, 0)
         estereotipos_value = estereotipos_data.get(user_id, 0)
         if isinstance(user_id, str):
             if user_id.startswith("discord_"):
@@ -253,13 +308,17 @@ def consolidate_all_data():
             elif user_id.startswith("estereotipos_"):
                 username = user_id.replace("estereotipos_", "")
                 blend_es_value = 0
         row = {
             "Username": username,
-            "Total": blend_es_value + include_value + estereotipos_value,
             "Blend-es": blend_es_value,
             "INCLUDE": include_value,
-            "Estereotipos": estereotipos_value
         }
         rows.append(row)

     return result
+def get_arena_data(username_mapping):
+    """Count arena conversations per user from ``arena.json``.
+
+    Each conversation in ``arena.json`` is attributed to the e-mail stored
+    under its ``"username"`` key. E-mails are translated to Discord names via
+    the ``gmail``/``discord`` columns of ``mail_to_username.csv`` and then
+    matched (case-insensitively) against the names in ``username_mapping``.
+
+    Args:
+        username_mapping: Mapping of user id -> username, used in reverse to
+            resolve a Discord name to an existing user id.
+
+    Returns:
+        A ``defaultdict(int)`` of conversation counts. Keys are user ids from
+        ``username_mapping`` when a match is found, ``"arena_<discord name>"``
+        when the Discord name is known but unmatched, and
+        ``"arena_<e-mail local part>"`` when the e-mail has no Discord name.
+        Missing files contribute nothing; any error is printed and whatever
+        was accumulated so far is returned.
+    """
+    import json
+    result = defaultdict(int)
+    try:
+        mail_to_discord = {}
+        if os.path.exists("mail_to_username.csv"):
+            mapping_df = pd.read_csv("mail_to_username.csv")
+            if "gmail" in mapping_df.columns and "discord" in mapping_df.columns:
+                for mail, discord in zip(mapping_df["gmail"], mapping_df["discord"]):
+                    # Empty cells come back as NaN (a float); skipping every
+                    # non-string keeps one bad row from aborting the load.
+                    if isinstance(mail, str) and isinstance(discord, str):
+                        mail_to_discord[mail.lower()] = discord.lower()
+        if not os.path.exists("arena.json"):
+            return result
+        with open("arena.json", "r", encoding="utf-8") as f:
+            arena_data = json.load(f)
+        mail_counts = defaultdict(int)
+        for conversations in arena_data.values():
+            for conversation in conversations:
+                if not isinstance(conversation, dict):
+                    continue
+                mail = conversation.get("username")
+                if isinstance(mail, str) and mail:
+                    mail_counts[mail.lower()] += 1
+        # Empty usernames are dropped: "" is a substring of every name and
+        # would otherwise swallow every unmatched Discord name below.
+        reverse_mapping = {
+            username.lower(): user_id
+            for user_id, username in username_mapping.items()
+            if isinstance(username, str) and username
+        }
+        for mail, count in mail_counts.items():
+            discord_name = mail_to_discord.get(mail, "")
+            if not discord_name:
+                # Use just the username portion of the email (before the @)
+                key = f"arena_{mail.split('@')[0]}"
+            elif discord_name in reverse_mapping:
+                # An exact name match always beats a partial one.
+                key = reverse_mapping[discord_name]
+            else:
+                # Fall back to the first name that contains, or is contained
+                # in, the Discord name; otherwise file it under "arena_".
+                key = next(
+                    (
+                        user_id
+                        for argilla_name, user_id in reverse_mapping.items()
+                        if discord_name in argilla_name or argilla_name in discord_name
+                    ),
+                    f"arena_{discord_name}",
+                )
+            # Accumulate: several e-mails may resolve to the same key.
+            result[key] += count
+    except Exception as e:
+        # Deliberate best-effort: a broken data file must not take down the
+        # leaderboard, so report the problem and return what we have.
+        print(f"Error loading arena data: {e}")
+    return result
 @lru_cache(maxsize=32)
 def get_user_contributions_cached(cache_buster: int):
     """Return consolidate_all_data()'s result, memoised per cache_buster value."""
     # cache_buster is never read here: it only forms the lru_cache key, so a
     # value not seen before forces a fresh consolidate_all_data() call.
     consolidated = consolidate_all_data()
     return consolidated
     blend_es_data, username_mapping = get_blend_es_data()
     include_data = get_include_data(username_mapping)
     estereotipos_data = get_estereotipos_data(username_mapping)
+    arena_data = get_arena_data(username_mapping)
+    all_user_ids = set(blend_es_data.keys()) | set(include_data.keys()) | set(estereotipos_data.keys()) | set(arena_data.keys())
     rows = []
     for user_id in all_user_ids:
         include_value = include_data.get(user_id, 0)
         estereotipos_value = estereotipos_data.get(user_id, 0)
+        arena_value = arena_data.get(user_id, 0)
         if isinstance(user_id, str):
             if user_id.startswith("discord_"):
             elif user_id.startswith("estereotipos_"):
                 username = user_id.replace("estereotipos_", "")
                 blend_es_value = 0
+            elif user_id.startswith("arena_"):
+                username = user_id.replace("arena_", "")
+                blend_es_value = 0
         row = {
             "Username": username,
+            "Total": blend_es_value + include_value + estereotipos_value + arena_value,
             "Blend-es": blend_es_value,
             "INCLUDE": include_value,
+            "Estereotipos": estereotipos_value,
+            "Arena": arena_value
         }
         rows.append(row)