sh1gechan committed on
Commit
c445cd9
·
verified ·
1 Parent(s): 96fd777

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +20 -21
app.py CHANGED
@@ -142,46 +142,45 @@ def filter_queries(query: str, filtered_df: pd.DataFrame):
142
 
143
 
144
  def filter_models(
145
- df: pd.DataFrame, type_query: list, size_query: list, precision_query: list,
146
- add_special_tokens_query: list, num_few_shots_query: list, show_deleted: bool,
147
- show_merges: bool, show_flagged: bool, shown_columns: list
148
  ) -> pd.DataFrame:
149
  print(f"Initial df shape: {df.shape}")
150
-
 
151
  filtered_df = df
152
 
153
- if 'T' in shown_columns:
154
- type_emoji = [t.split()[0] for t in type_query]
155
- filtered_df = filtered_df[filtered_df['T'].isin(type_emoji)]
156
  print(f"After type filter: {filtered_df.shape}")
157
 
158
- if 'Precision' in shown_columns:
159
- filtered_df = filtered_df[filtered_df['Precision'].isin(precision_query + ['Unknown', '?'])]
160
  print(f"After precision filter: {filtered_df.shape}")
161
 
162
- if '#Params (B)' in shown_columns:
163
- if 'Unknown' in size_query:
164
- size_mask = filtered_df['#Params (B)'].isna() | (filtered_df['#Params (B)'] == 0)
165
- else:
166
- size_mask = filtered_df['#Params (B)'].apply(lambda x: any(pd.Interval(NUMERIC_INTERVALS[s].left, NUMERIC_INTERVALS[s].right).contains(x) for s in size_query if s != 'Unknown'))
167
- filtered_df = filtered_df[size_mask]
168
  print(f"After size filter: {filtered_df.shape}")
169
 
170
- if 'Add Special Tokens' in shown_columns:
171
- filtered_df = filtered_df[filtered_df['Add Special Tokens'].isin(add_special_tokens_query + ['Unknown', '?'])]
172
  print(f"After add_special_tokens filter: {filtered_df.shape}")
173
 
174
- if 'Few-shot' in shown_columns:
175
- filtered_df = filtered_df[filtered_df['Few-shot'].astype(str).isin([str(x) for x in num_few_shots_query] + ['Unknown', '?'])]
176
  print(f"After num_few_shots filter: {filtered_df.shape}")
177
 
178
- if not show_deleted and 'Available on the hub' in shown_columns:
 
179
  filtered_df = filtered_df[filtered_df['Available on the hub'] == True]
180
  print(f"After show_deleted filter: {filtered_df.shape}")
181
 
182
  print("Filtered dataframe head:")
183
  print(filtered_df.head())
184
-
185
  return filtered_df
186
 
187
  leaderboard_df = filter_models(leaderboard_df, [t.to_str(" : ") for t in ModelType], list(NUMERIC_INTERVALS.keys()), [i.value.name for i in Precision], [i.value.name for i in AddSpecialTokens], [i.value.name for i in NumFewShots], False, False, False)
 
142
 
143
 
144
  def filter_models(
145
+ df: pd.DataFrame, type_query: list, size_query: list, precision_query: list, add_special_tokens_query: list, num_few_shots_query: list, show_deleted: bool, show_merges: bool, show_flagged: bool
 
 
146
  ) -> pd.DataFrame:
147
  print(f"Initial df shape: {df.shape}")
148
+ print(f"Initial df content:\n{df}")
149
+
150
  filtered_df = df
151
 
152
+ # Model Type フィルタリング
153
+ type_emoji = [t.split()[0] for t in type_query]
154
+ filtered_df = filtered_df[filtered_df['T'].isin(type_emoji)]
155
  print(f"After type filter: {filtered_df.shape}")
156
 
157
+ # Precision フィルタリング
158
+ filtered_df = filtered_df[filtered_df['Precision'].isin(precision_query + ['Unknown', '?'])]
159
  print(f"After precision filter: {filtered_df.shape}")
160
 
161
+ # Model Size フィルタリング
162
+ if 'Unknown' in size_query:
163
+ size_mask = filtered_df['#Params (B)'].isna() | (filtered_df['#Params (B)'] == 0)
164
+ else:
165
+ size_mask = filtered_df['#Params (B)'].apply(lambda x: any(x in NUMERIC_INTERVALS[s] for s in size_query if s != 'Unknown'))
166
+ filtered_df = filtered_df[size_mask]
167
  print(f"After size filter: {filtered_df.shape}")
168
 
169
+ # Add Special Tokens フィルタリング
170
+ filtered_df = filtered_df[filtered_df['Add Special Tokens'].isin(add_special_tokens_query + ['Unknown', '?'])]
171
  print(f"After add_special_tokens filter: {filtered_df.shape}")
172
 
173
+ # Num Few Shots フィルタリング
174
+ filtered_df = filtered_df[filtered_df['Few-shot'].astype(str).isin([str(x) for x in num_few_shots_query] + ['Unknown', '?'])]
175
  print(f"After num_few_shots filter: {filtered_df.shape}")
176
 
177
+ # Show deleted models フィルタリング
178
+ if not show_deleted:
179
  filtered_df = filtered_df[filtered_df['Available on the hub'] == True]
180
  print(f"After show_deleted filter: {filtered_df.shape}")
181
 
182
  print("Filtered dataframe head:")
183
  print(filtered_df.head())
 
184
  return filtered_df
185
 
186
  leaderboard_df = filter_models(leaderboard_df, [t.to_str(" : ") for t in ModelType], list(NUMERIC_INTERVALS.keys()), [i.value.name for i in Precision], [i.value.name for i in AddSpecialTokens], [i.value.name for i in NumFewShots], False, False, False)