AutoGPT/benchmark/agbenchmark/challenges/deprecated/code/d2.2_vague/data.json

34 lines
842 B
JSON

{
"category": [
"code",
"iterate"
],
"cutoff": 75,
"dependencies": [
"TestDebugSimpleTypoWithGuidance"
],
"eval_id": "1d171b68-0374-4b08-ae6a-c7223f89ecc1",
"ground": {
"answer": "[0, 1] [2, 5] [0, 3]",
"eval": {
"type": "python"
},
"files": [
"test.py"
],
"should_contain": [
"[0, 1]",
"[2, 5]",
"[0, 3]"
],
"should_not_contain": []
},
"info": {
"description": "Tests the agent's ability to debug Python code containing a simple typo, given only a very broad prompt with no guidance",
"difficulty": "intermediate",
"side_effects": []
},
"name": "DebugSimpleTypoWithoutGuidance",
"task": "Make test.py run without errors."
}