Spaces:

avid-ml
/

biasaware

Sleeping

App Files Community

freyam committed on Sep 30, 2023

Commit

1869ec4

1 Parent(s): de10a36

Add 1000 db

Browse files

Files changed (7) hide show

app.py +11 -9
data/amazon_1000.csv +0 -0
data/imdb_100.csv +0 -0
data/imdb_1000.csv +0 -0
data/twitter_1000.csv +0 -0
data/z_employee.csv +0 -26
data/z_sentences.csv +0 -11

app.py CHANGED Viewed

@@ -9,6 +9,12 @@ from scripts.gender_distribution import *
 methodologies = json.load(open("config/methodologies.json", "r"))
 MAX_THRESHOLD = 5000
 DATASET_CACHE = {}
@@ -16,7 +22,7 @@ DATASET_CACHE = {}
 def evaluate(dataset, sampling_method, sampling_size, column, methodology):
     try:
         print(
-            f"[{dataset.name.split('/')[-1]}::{column}] - {sampling_method} {sampling_size} entries"
         )
         data = DATASET_CACHE.setdefault(dataset.name, pd.read_csv(dataset.name))[
             [column]
@@ -125,16 +131,12 @@ with BiasAware:
     )
     with gr.Row():
-        with gr.Column(scale=2):
             gr.Markdown("## Dataset")
             dataset_file = gr.File(label="Dataset", file_types=["csv"])
             dataset_examples = gr.Examples(
-                [
-                    os.path.join(os.path.dirname(__file__), "data/imdb_100.csv"),
-                    os.path.join(os.path.dirname(__file__), "data/z_employee.csv"),
-                    os.path.join(os.path.dirname(__file__), "data/z_sentences.csv"),
-                ],
                 inputs=dataset_file,
                 label="Example Datasets",
             )
@@ -147,7 +149,7 @@ with BiasAware:
                 row_count=(5, "fixed"), col_count=(1, "fixed"), visible=False
             )
-        with gr.Column(scale=2):
             gr.Markdown("## Methodology")
             methodology = gr.Radio(
@@ -160,7 +162,7 @@ with BiasAware:
             methodology_metadata = gr.Markdown(visible=False)
-        with gr.Column(scale=4):
             result = gr.Markdown("## Result")
             result_plot = gr.Plot(show_label=False, container=False, visible=False)

 methodologies = json.load(open("config/methodologies.json", "r"))
+datasets = [
+    os.path.join(os.path.dirname(__file__), "data", f)
+    for f in os.listdir(os.path.join(os.path.dirname(__file__), "data"))
+    if f.endswith(".csv")
+]
 MAX_THRESHOLD = 5000
 DATASET_CACHE = {}
 def evaluate(dataset, sampling_method, sampling_size, column, methodology):
     try:
         print(
+            f"[{dataset.name.split('/')[-1]}::{column}] - {sampling_method} {sampling_size} entries using {methodology}"
         )
         data = DATASET_CACHE.setdefault(dataset.name, pd.read_csv(dataset.name))[
             [column]
     )
     with gr.Row():
+        with gr.Column(scale=1):
             gr.Markdown("## Dataset")
             dataset_file = gr.File(label="Dataset", file_types=["csv"])
             dataset_examples = gr.Examples(
+                examples=datasets,
                 inputs=dataset_file,
                 label="Example Datasets",
             )
                 row_count=(5, "fixed"), col_count=(1, "fixed"), visible=False
             )
+        with gr.Column(scale=1):
             gr.Markdown("## Methodology")
             methodology = gr.Radio(
             methodology_metadata = gr.Markdown(visible=False)
+        with gr.Column(scale=2):
             result = gr.Markdown("## Result")
             result_plot = gr.Plot(show_label=False, container=False, visible=False)

data/amazon_1000.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

data/imdb_100.csv DELETED Viewed

The diff for this file is too large to render. See raw diff

data/imdb_1000.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

data/twitter_1000.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

data/z_employee.csv DELETED Viewed

@@ -1,26 +0,0 @@
-EmployeeID,FirstName,LastName,Email,Department,Salary
-101,John,Smith,[email protected],Finance,60000
-102,Emily,Johnson,[email protected],Marketing,55000
-103,Michael,Williams,[email protected],HR,50000
-104,Susan,Anderson,[email protected],IT,65000
-105,David,Martin,[email protected],Sales,58000
-106,Linda,Davis,[email protected],Finance,62000
-107,William,Miller,[email protected],Marketing,56000
-108,Sarah,Anderson,[email protected],HR,51000
-109,Robert,Clark,[email protected],IT,67000
-110,Karen,Wilson,[email protected],Sales,59000
-111,James,Brown,[email protected],Finance,61000
-112,Anna,Johnson,[email protected],Marketing,57000
-113,Christopher,Moore,[email protected],HR,52000
-114,Laura,White,[email protected],IT,68000
-115,Mark,Davis,[email protected],Sales,60000
-116,Patricia,Jones,[email protected],Finance,63000
-117,Matthew,Taylor,[email protected],Marketing,58000
-118,Jennifer,Young,[email protected],HR,53000
-119,Steven,Anderson,[email protected],IT,69000
-120,Elizabeth,Thomas,[email protected],Sales,61000
-121,Kevin,Harris,[email protected],Finance,64000
-122,Deborah,Smith,[email protected],Marketing,59000
-123,Joseph,Walker,[email protected],HR,54000
-124,Cynthia,Jackson,[email protected],IT,70000
-125,Daniel,Hall,[email protected],Sales,62000

data/z_sentences.csv DELETED Viewed

@@ -1,11 +0,0 @@
-ID,Sentences,Gender Bias Test
-1,The doctor examined the patient.,Neutral
-2,The teacher helped the student with their homework.,Neutral
-3,The engineer designed the new software.,Neutral
-4,The nurse cared for the sick child.,Neutral
-5,The chef prepared a delicious meal.,Neutral
-6,The firefighter bravely rescued people from the burning building.,Neutral
-7,The police officer maintained law and order in the city.,Neutral
-8,The scientist conducted groundbreaking research.,Neutral
-9,The artist created a beautiful masterpiece.,Neutral
-10,The CEO made important decisions for the company.,Neutral