fzoll committed on
Commit
2a09920
·
1 Parent(s): 5fc7ea7
Files changed (1) hide show
  1. app/backend/data_engine.py +16 -2
app/backend/data_engine.py CHANGED
@@ -113,6 +113,15 @@ class DataEngine:
113
  for _, row in grouped_dataset_count.iterrows():
114
  dataset_num_map[row["group_name"]] = row["dataset_name"]
115
 
 
 
 
 
 
 
 
 
 
116
  grouped_model = df.groupby(["model_name", "group_name"]).agg({
117
  "ndcg_at_10": "mean",
118
  }).reset_index()
@@ -121,13 +130,18 @@ class DataEngine:
121
 
122
  # Rename columns
123
  pivot.columns = list(
124
- map(lambda x: f"{x[1].capitalize()} Average ({dataset_num_map[x[1]]} datasets)" if x[
125
- 1] != 'text' else f"Average ({dataset_num_map[x[1]]} datasets)",
126
  pivot.columns))
127
 
128
  pivot_dataset = df_result.pivot(index="model_name", columns="dataset_name", values="ndcg_at_10")
129
 
 
 
 
 
 
130
  df = pd.merge(df_model, pivot, on="model_name")
 
131
  df = pd.merge(df, pivot_dataset, on="model_name")
132
 
133
  if df.empty:
 
113
  for _, row in grouped_dataset_count.iterrows():
114
  dataset_num_map[row["group_name"]] = row["dataset_name"]
115
 
116
+ # Create a list of open datasets
117
+ open_datasets = []
118
+ for result in results_list:
119
+ if not result.get("is_closed", False):
120
+ open_datasets.append(result["dataset_name"])
121
+
122
+ # Count open datasets
123
+ open_dataset_count = len(open_datasets)
124
+
125
  grouped_model = df.groupby(["model_name", "group_name"]).agg({
126
  "ndcg_at_10": "mean",
127
  }).reset_index()
 
130
 
131
  # Rename columns
132
  pivot.columns = list(
133
+ map(lambda x: f"{x[1].capitalize()} Average ({dataset_num_map[x[1]]} datasets)" if x[1] != 'text' else f"Average ({dataset_num_map[x[1]]} datasets)",
 
134
  pivot.columns))
135
 
136
  pivot_dataset = df_result.pivot(index="model_name", columns="dataset_name", values="ndcg_at_10")
137
 
138
+ # Calculate open average
139
+ open_df = df_result[df_result["dataset_name"].isin(open_datasets)]
140
+ open_avg = open_df.groupby("model_name")["ndcg_at_10"].mean().reset_index()
141
+ open_avg = open_avg.rename(columns={"ndcg_at_10": f"Open average ({open_dataset_count} datasets)"})
142
+
143
  df = pd.merge(df_model, pivot, on="model_name")
144
+ df = pd.merge(df, open_avg, on="model_name")
145
  df = pd.merge(df, pivot_dataset, on="model_name")
146
 
147
  if df.empty: