mirror of
https://github.com/Significant-Gravitas/AutoGPT.git
synced 2026-01-09 15:17:59 -05:00
Make agbenchmark a Proxy of the evaluated agent Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com>
33 lines
1.1 KiB
JSON
33 lines
1.1 KiB
JSON
{
|
|
"name": "ThreeSum",
|
|
"category": [
|
|
"coding",
|
|
"iterate"
|
|
],
|
|
"task": "Create a three_sum function in a file called sample_code.py. Given an array of integers, return indices of the three numbers such that they add up to a specific target. You may assume that each input would have exactly one solution, and you may not use the same element twice. Example: Given nums = [2, 7, 11, 15], target = 20, Because nums[0] + nums[1] + nums[2] = 2 + 7 + 11 = 20, return [0, 1, 2].",
|
|
"dependencies": [
|
|
"FunctionCodeGeneration"
|
|
],
|
|
"cutoff": 60,
|
|
"ground": {
|
|
"answer": "The three_sum function coded properly.",
|
|
"should_contain": [
|
|
"[0, 1, 2]",
|
|
"[0, 2, 5]",
|
|
"[0, 2, 3]"
|
|
],
|
|
"should_not_contain": [],
|
|
"files": [
|
|
"test.py"
|
|
],
|
|
"eval": {
|
|
"type": "python"
|
|
}
|
|
},
|
|
"info": {
|
|
"difficulty": "basic",
|
|
"description": "s ability for the agent to create the three_sum function.",
|
|
"side_effects": []
|
|
},
|
|
"eval_id": "ceb2ebfd-45da-40a4-92e9-909dedb23352"
|
|
} |