Uniquify submissions based on HF username
Browse files
- evaluate.py +1 -0
- utils.py +2 -1
evaluate.py
CHANGED
|
@@ -255,6 +255,7 @@ def _evaluate_data(filename: str, test_repo: str, split_filename: str, results_r
|
|
| 255 |
results_df['submission_time'] = timestamp
|
| 256 |
results_df['model_report'] = report
|
| 257 |
results_df['anonymous'] = meta.participant.anonymous
|
|
|
|
| 258 |
safe_user = _unsafify_username(username)
|
| 259 |
destination_path = f"results/{safe_user}_{timestamp}_results.csv"
|
| 260 |
tmp_name = None
|
|
|
|
| 255 |
results_df['submission_time'] = timestamp
|
| 256 |
results_df['model_report'] = report
|
| 257 |
results_df['anonymous'] = meta.participant.anonymous
|
| 258 |
+
results_df['hf_username'] = username
|
| 259 |
safe_user = _unsafify_username(username)
|
| 260 |
destination_path = f"results/{safe_user}_{timestamp}_results.csv"
|
| 261 |
tmp_name = None
|
utils.py
CHANGED
|
@@ -28,6 +28,7 @@ def fetch_dataset_df():
|
|
| 28 |
'submission_time': Value('string'),
|
| 29 |
'model_report': Value('string'),
|
| 30 |
'anonymous': Value('bool'),
|
|
|
|
| 31 |
}
|
| 32 |
feature_schema = Features(metric_features | other_features)
|
| 33 |
|
|
@@ -51,7 +52,7 @@ def fetch_dataset_df():
|
|
| 51 |
# Get the most recent submission per user & endpoint
|
| 52 |
latest = (
|
| 53 |
df.sort_values("submission_time")
|
| 54 |
-
.drop_duplicates(subset=["Endpoint", "user"], keep="last")
|
| 55 |
.sort_values(["Endpoint", "user"])
|
| 56 |
.reset_index(drop=True)
|
| 57 |
)
|
|
|
|
| 28 |
'submission_time': Value('string'),
|
| 29 |
'model_report': Value('string'),
|
| 30 |
'anonymous': Value('bool'),
|
| 31 |
+
'hf_username': Value('string')
|
| 32 |
}
|
| 33 |
feature_schema = Features(metric_features | other_features)
|
| 34 |
|
|
|
|
| 52 |
# Get the most recent submission per user & endpoint
|
| 53 |
latest = (
|
| 54 |
df.sort_values("submission_time")
|
| 55 |
+
.drop_duplicates(subset=["Endpoint", "hf_username"], keep="last") #IMPORTANT: unique on HF username not display name
|
| 56 |
.sort_values(["Endpoint", "user"])
|
| 57 |
.reset_index(drop=True)
|
| 58 |
)
|