Auto-GPT-20230801081506

This commit is contained in:
Auto-GPT-Bot
2023-08-01 08:15:06 +00:00
parent f799503105
commit a4ab5f51c9
2 changed files with 73 additions and 58 deletions

View File

@@ -0,0 +1,14 @@
{
"command": "agbenchmark start",
"completion_time": "2023-08-01-08:15",
"benchmark_start_time": "2023-08-01-08:13",
"metrics": {
"run_time": "61.37 seconds",
"highest_difficulty": "No successful tests"
},
"tests": {},
"config": {
"workspace": "auto_gpt_workspace",
"entry_path": "agbenchmark.benchmarks"
}
}

View File

@@ -1,4 +1,13 @@
{
"TestAdaptLink": [
false
],
"TestAdaptSimpleTypoWithGuidance": [
false
],
"TestAdaptTeslaRevenue": [
false
],
"TestBasicContentGen": [
false,
false
@@ -11,14 +20,38 @@
false,
false
],
"TestDebugMultipleTypo": [
false
],
"TestDebugSimpleTypoWithGuidance": [
true,
true
],
"TestDebugSimpleTypoWithoutGuidance": [
false
],
"TestFunctionCodeGeneration": [
false
],
"TestGoalDivergence": [
false,
false
],
"TestGoalLoss_Hard": [
false
],
"TestGoalLoss_Medium": [
false
],
"TestGoalLoss_Simple": [
false
],
"TestGoalLoss_advanced": [
false
],
"TestInstructionFollowing": [
false
],
"TestPlanCreation": [
true,
true
@@ -27,64 +60,10 @@
true,
true
],
"TestReturnCode_Simple": [
false,
false
],
"TestSearch": [
false,
false
],
"TestWriteFile": [
true,
true
],
"TestAdaptLink": [
false
],
"TestRevenueRetrieval_1.2": [
false
],
"TestRevenueRetrieval_1.1": [
false
],
"TestRevenueRetrieval_1.0": [
false
],
"TestReturnCode_Write": [
false
],
"TestDebugSimpleTypoWithoutGuidance": [
false
],
"TestAdaptSimpleTypoWithGuidance": [
false
],
"TestInstructionFollowing": [
false
],
"TestGoalLoss_Simple": [
false
],
"TestGoalLoss_advanced": [
false
],
"TestGoalLoss_Hard": [
false
],
"TestGoalLoss_Medium": [
false
],
"TestRememberMultipleIds": [
false
],
"TestFunctionCodeGeneration": [
false
],
"TestReturnCode_Modify": [
false
],
"TestDebugMultipleTypo": [
"TestRememberMultiplePhrasesWithNoise": [
false
],
"TestRememberMultipleWithNoise": [
@@ -93,16 +72,38 @@
"TestRetrieval3": [
false
],
"TestAdaptTeslaRevenue": [
"TestReturnCode_Modify": [
false
],
"TestThreeSum": [
"TestReturnCode_Simple": [
false,
false
],
"TestReturnCode_Tests": [
false
],
"TestRememberMultiplePhrasesWithNoise": [
"TestReturnCode_Write": [
false
],
"TestRevenueRetrieval_1.0": [
false
],
"TestRevenueRetrieval_1.1": [
false
],
"TestRevenueRetrieval_1.2": [
false
],
"TestSearch": [
false,
false
],
"TestThreeSum": [
false
],
"TestWriteFile": [
true,
true,
false
]
}