Spaces:

sartifyllc
/

Swahili-Text-Embeddings-Leaderboard

Running

App Files Community

Mollel committed on Jul 13, 2024

Commit

a323ffa

verified ·

1 Parent(s): ae12324

Update app.py

Browse files

Files changed (1) hide show

app.py +29 -2

app.py CHANGED Viewed

@@ -21,6 +21,31 @@ def extract_table_from_markdown(markdown_text, table_start):
             table_content.append(line)
     return '\n'.join(table_content)
 def markdown_table_to_df(table_content):
     """Convert markdown table to pandas DataFrame."""
     # Split the table content into lines
@@ -33,8 +58,10 @@ def markdown_table_to_df(table_content):
     data = []
     for line in lines[2:]:  # Skip the header separator line
         row = [cell.strip() for cell in line.split('|') if cell.strip()]
-        if row and len(row) == len(headers):  # Ensure row has the correct number of columns
-            data.append(row)
     # Create DataFrame
     df = pd.DataFrame(data, columns=headers)

             table_content.append(line)
     return '\n'.join(table_content)
+# def markdown_table_to_df(table_content):
+#     """Convert markdown table to pandas DataFrame."""
+#     # Split the table content into lines
+#     lines = table_content.split('\n')
+#     # Extract headers
+#     headers = [h.strip() for h in lines[0].split('|') if h.strip()]
+#     # Extract data
+#     data = []
+#     for line in lines[2:]:  # Skip the header separator line
+#         row = [cell.strip() for cell in line.split('|') if cell.strip()]
+#         if row and len(row) == len(headers):  # Ensure row has the correct number of columns
+#             data.append(row)
+#     # Create DataFrame
+#     df = pd.DataFrame(data, columns=headers)
+#     # Convert numeric columns to float
+#     for col in df.columns:
+#         if col not in ["Model Name", "Publisher", "Open?", "Basemodel", "Matryoshka"]:
+#             df[col] = pd.to_numeric(df[col], errors='coerce')
+#     return df
 def markdown_table_to_df(table_content):
     """Convert markdown table to pandas DataFrame."""
     # Split the table content into lines
     data = []
     for line in lines[2:]:  # Skip the header separator line
         row = [cell.strip() for cell in line.split('|') if cell.strip()]
+        if row:  # Include any non-empty row
+            # Pad the row with empty strings if it's shorter than the headers
+            padded_row = row + [''] * (len(headers) - len(row))
+            data.append(padded_row[:len(headers)])  # Trim if longer than headers
     # Create DataFrame
     df = pd.DataFrame(data, columns=headers)