[
  {
    "agent_name": "GenericAgent-AgentTrek-1.0-32b",
    "study_id": "ed14232c-cd7e-4708-b334-ebaf1f220000",
    "date_time": "2025-01-12 00:37:04",
    "benchmark": "WorkArena-L1",
    "score": 38.29,
    "std_err": 2.70,
    "benchmark_specific": "No",
    "benchmark_tuned": "No",
    "followed_evaluation_protocol": "Yes",
    "reproducible": "Yes",
    "comments": "Additional details",
    "original_or_reproduced": "Original"
  }
]