Aman-J's picture
fix decimals
1eeaad6
raw
history blame
430 Bytes
[
{
"agent_name": "GenericAgent-GPT-5",
"study_id": "2025-08-07_21-09-16",
"benchmark": "WorkArena-L1",
"score": 79.1,
"std_err": 2.2,
"benchmark_specific": "No",
"benchmark_tuned": "No",
"followed_evaluation_protocol": "No",
"reproducible": "Yes",
"comments": "Increased max_steps from 15 to 30",
"original_or_reproduced": "Original",
"date_time": "2025-08-07 21:09:16"
}
]