Spaces:

sartifyllc
/

Swahili-Text-Embeddings-Leaderboard

Running

App Files Community

Mollel committed on Jul 13, 2024

Commit

93dfa2b

verified ·

1 Parent(s): 138fae9

Update app.py

Browse files

Files changed (1) hide show

app.py +30 -1

app.py CHANGED Viewed

@@ -49,6 +49,35 @@ def extract_table_from_markdown(markdown_text, table_start):
 #     return df
 def markdown_table_to_df(table_content):
     """Convert markdown table to pandas DataFrame."""
     # Split the table content into lines
@@ -72,7 +101,7 @@ def markdown_table_to_df(table_content):
     # Convert numeric columns to float and handle Dimension column
     for col in df.columns:
         if col == "Dimension":
-            df[col] = df[col].apply(lambda x: int(x) if x.isdigit() else "")
         elif col not in ["Model Name", "Publisher", "Open?", "Basemodel", "Matryoshka"]:
             df[col] = pd.to_numeric(df[col], errors='coerce')

 #     return df
+# def markdown_table_to_df(table_content):
+#     """Convert markdown table to pandas DataFrame."""
+#     # Split the table content into lines
+#     lines = table_content.split('\n')
+#     # Extract headers
+#     headers = [h.strip() for h in lines[0].split('|') if h.strip()]
+#     # Extract data
+#     data = []
+#     for line in lines[2:]:  # Skip the header separator line
+#         row = [cell.strip() for cell in line.split('|') if cell.strip()]
+#         if row:  # Include any non-empty row
+#             # Pad the row with empty strings if it's shorter than the headers
+#             padded_row = row + [''] * (len(headers) - len(row))
+#             data.append(padded_row[:len(headers)])  # Trim if longer than headers
+#     # Create DataFrame
+#     df = pd.DataFrame(data, columns=headers)
+#     # Convert numeric columns to float and handle Dimension column
+#     for col in df.columns:
+#         if col == "Dimension":
+#             df[col] = df[col].apply(lambda x: int(x) if x.isdigit() else "")
+#         elif col not in ["Model Name", "Publisher", "Open?", "Basemodel", "Matryoshka"]:
+#             df[col] = pd.to_numeric(df[col], errors='coerce')
+#     return df
 def markdown_table_to_df(table_content):
     """Convert markdown table to pandas DataFrame."""
     # Split the table content into lines
     # Convert numeric columns to float and handle Dimension column
     for col in df.columns:
         if col == "Dimension":
+            df[col] = df[col].apply(lambda x: int(x) if x.isdigit() else None)
         elif col not in ["Model Name", "Publisher", "Open?", "Basemodel", "Matryoshka"]:
             df[col] = pd.to_numeric(df[col], errors='coerce')