hmacdope committed on
Commit
2be70e9
·
1 Parent(s): cf48806

Deduplicate submissions by HF username instead of display name

Browse files
Files changed (2) hide show
  1. evaluate.py +1 -0
  2. utils.py +2 -1
evaluate.py CHANGED
@@ -255,6 +255,7 @@ def _evaluate_data(filename: str, test_repo: str, split_filename: str, results_r
255
  results_df['submission_time'] = timestamp
256
  results_df['model_report'] = report
257
  results_df['anonymous'] = meta.participant.anonymous
 
258
  safe_user = _unsafify_username(username)
259
  destination_path = f"results/{safe_user}_{timestamp}_results.csv"
260
  tmp_name = None
 
255
  results_df['submission_time'] = timestamp
256
  results_df['model_report'] = report
257
  results_df['anonymous'] = meta.participant.anonymous
258
+ results_df['hf_username'] = username
259
  safe_user = _unsafify_username(username)
260
  destination_path = f"results/{safe_user}_{timestamp}_results.csv"
261
  tmp_name = None
utils.py CHANGED
@@ -28,6 +28,7 @@ def fetch_dataset_df():
28
  'submission_time': Value('string'),
29
  'model_report': Value('string'),
30
  'anonymous': Value('bool'),
 
31
  }
32
  feature_schema = Features(metric_features | other_features)
33
 
@@ -51,7 +52,7 @@ def fetch_dataset_df():
51
  # Get the most recent submission per user & endpoint
52
  latest = (
53
  df.sort_values("submission_time")
54
- .drop_duplicates(subset=["Endpoint", "user"], keep="last")
55
  .sort_values(["Endpoint", "user"])
56
  .reset_index(drop=True)
57
  )
 
28
  'submission_time': Value('string'),
29
  'model_report': Value('string'),
30
  'anonymous': Value('bool'),
31
+ 'hf_username': Value('string')
32
  }
33
  feature_schema = Features(metric_features | other_features)
34
 
 
52
  # Get the most recent submission per user & endpoint
53
  latest = (
54
  df.sort_values("submission_time")
55
+ .drop_duplicates(subset=["Endpoint", "hf_username"], keep="last") #IMPORTANT: unique on HF username not display name
56
  .sort_values(["Endpoint", "user"])
57
  .reset_index(drop=True)
58
  )