Aman-J's picture
fix decimals
1eeaad6
raw
history blame
429 Bytes
[
{
"agent_name": "GenericAgent-GPT-5",
"study_id": "2025-08-07_21-09-16",
"benchmark": "WorkArena-L3",
"score": 11.5,
"std_err": 2.1,
"benchmark_specific": "No",
"benchmark_tuned": "No",
"followed_evaluation_protocol": "No",
"reproducible": "Yes",
"comments": "Increased max_steps from 50 to 100",
"original_or_reproduced": "Original",
"date_time": "2025-08-07 21:09:16"
}
]