{
"TestReadFile": {
"difficulty": "basic",
"dependencies": [
"TestWriteFile"
],
"test": "agbenchmark/challenges/interface/read_file",
"success": true
},
"TestBasicMemory": {
"difficulty": "basic",
"dependencies": [
"TestReadFile",
"TestWriteFile"
],
"test": "agbenchmark/challenges/memory/m1",
"success": true
},
"TestBasicRetrieval": {
"difficulty": "basic",
"dependencies": [
"TestWriteFile",
"TestSearch"
],
"test": "agbenchmark/challenges/retrieval/r1",
"success": true
},
"TestRememberMultipleIds": {
"difficulty": "basic",
"dependencies": [
"TestBasicMemory"
],
"test": "agbenchmark/challenges/memory/m2",
"success": true
},
"TestRetrieval2": {
"difficulty": "basic",
"dependencies": [
"TestBasicRetrieval"
],
"test": "agbenchmark/challenges/retrieval/r2",
"success": true
},
"TestRememberMultipleIdsWithNoise": {
"difficulty": "medium",
"dependencies": [
"TestRememberMultipleIds"
],
"test": "agbenchmark/challenges/memory/m3",
"success": true
},
"TestRetrieval3": {
"difficulty": "basic",
"dependencies": [
"TestRetrieval2"
],
"test": "agbenchmark/challenges/retrieval/r3",
"success": true
},
"TestRememberMultiplePhrasesWithNoise": {
"difficulty": "medium",
"dependencies": [
"TestRememberMultipleIdsWithNoise"
],
"test": "agbenchmark/challenges/memory/m4",
"success": true
},
"TestSearch": {
"difficulty": "basic",
"dependencies": [
"TestWriteFile"
],
"test": "agbenchmark/challenges/interface/search",
"success": true
},
"TestWriteFile": {
"difficulty": "basic",
"dependencies": [],
"test": "agbenchmark/challenges/interface/write_file",
"success": true
},
"TestDebugSimpleTypoWithGuidance": {
"difficulty": "basic",
"dependencies": [
"TestReadFile",
"TestWriteFile"
],
"test": "agbenchmark/challenges/code/d1",
"success": true
},
"TestDebugSimpleTypoWithoutGuidance": {
"difficulty": "medium",
"dependencies": [
"TestDebugSimpleTypoWithGuidance"
],
"test": "agbenchmark/challenges/code/d2",
"success": true
}
}