gpt-engineer-20230801081428

pull/5155/head
Auto-GPT-Bot 2023-08-01 08:14:28 +00:00
parent f0615f77ec
commit 2cd4ffcd90
3 changed files with 72 additions and 52 deletions

View File

@ -0,0 +1,14 @@
{
"command": "agbenchmark start",
"completion_time": "2023-08-01-08:14",
"benchmark_start_time": "2023-08-01-08:13",
"metrics": {
"run_time": "62.54 seconds",
"highest_difficulty": "No successful tests"
},
"tests": {},
"config": {
"workspace": "projects/my-new-project/workspace",
"entry_path": "agbenchmark.benchmarks"
}
}

View File

@ -1 +1,6 @@
{}
{
"TestWriteFile": {
"difficulty": "interface",
"data_path": "agbenchmark/challenges/interface/write_file/data.json"
}
}

View File

@ -3,6 +3,12 @@
false,
false
],
"TestAdaptSimpleTypoWithGuidance": [
false
],
"TestAdaptTeslaRevenue": [
false
],
"TestBasicContentGen": [
false,
false
@ -15,14 +21,38 @@
false,
false
],
"TestDebugMultipleTypo": [
false
],
"TestDebugSimpleTypoWithGuidance": [
false,
false
],
"TestDebugSimpleTypoWithoutGuidance": [
false
],
"TestFunctionCodeGeneration": [
false
],
"TestGoalDivergence": [
false,
false
],
"TestGoalLoss_Hard": [
false
],
"TestGoalLoss_Medium": [
false
],
"TestGoalLoss_Simple": [
false
],
"TestGoalLoss_advanced": [
false
],
"TestInstructionFollowing": [
false
],
"TestPlanCreation": [
false,
true
@ -31,10 +61,28 @@
false,
false
],
"TestRememberMultipleIds": [
false
],
"TestRememberMultiplePhrasesWithNoise": [
false
],
"TestRememberMultipleWithNoise": [
false
],
"TestRetrieval3": [
false
],
"TestReturnCode_Modify": [
false
],
"TestReturnCode_Simple": [
false,
false
],
"TestReturnCode_Tests": [
false
],
"TestReturnCode_Write": [
false,
false
@ -55,59 +103,12 @@
false,
false
],
"TestWriteFile": [
true,
true
],
"TestDebugSimpleTypoWithoutGuidance": [
false
],
"TestAdaptSimpleTypoWithGuidance": [
false
],
"TestInstructionFollowing": [
false
],
"TestGoalLoss_Simple": [
false
],
"TestGoalLoss_advanced": [
false
],
"TestGoalLoss_Hard": [
false
],
"TestGoalLoss_Medium": [
false
],
"TestRememberMultipleIds": [
false
],
"TestFunctionCodeGeneration": [
false
],
"TestReturnCode_Modify": [
false
],
"TestDebugMultipleTypo": [
false
],
"TestRememberMultipleWithNoise": [
false
],
"TestRetrieval3": [
false
],
"TestAdaptTeslaRevenue": [
false
],
"TestThreeSum": [
false
],
"TestReturnCode_Tests": [
false
],
"TestRememberMultiplePhrasesWithNoise": [
false
"TestWriteFile": [
true,
true,
true
]
}