mirror of
https://github.com/Significant-Gravitas/AutoGPT.git
synced 2026-01-08 22:58:01 -05:00
Make agbenchmark a Proxy of the evaluated agent Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com>
30 lines
892 B
JSON
30 lines
892 B
JSON
{
|
|
"name": "RevenueRetrieval1.2",
|
|
"category": [
|
|
"retrieval"
|
|
],
|
|
"task": "Write tesla's exact revenue in 2022 into a .txt file. Use the US notation, with a precision rounded to the nearest million dollars (for instance, $31,578 billion).",
|
|
"dependencies": [
|
|
"RevenueRetrieval1.1"
|
|
],
|
|
"cutoff": 60,
|
|
"ground": {
|
|
"answer": "It was $81.462 billion in 2022. In millions the answer is 81,462.",
|
|
"should_contain": [
|
|
"81,462"
|
|
],
|
|
"should_not_contain": [],
|
|
"files": [
|
|
".txt"
|
|
],
|
|
"eval": {
|
|
"type": "file"
|
|
}
|
|
},
|
|
"info": {
|
|
"difficulty": "intermediate",
|
|
"description": "Advanced version of the r2.1 challenge that also asks for specific formatting.",
|
|
"side_effects": []
|
|
},
|
|
"eval_id": "02c4f6ec-3246-4677-afb9-c9c836fd78a6"
|
|
} |