Fix debug code challenge (#4632)

parent 3b0d49a3e0
commit 12ed5a957b

@@ -6,7 +6,7 @@ from autogpt.agent import Agent
 from autogpt.commands.file_operations import read_file
 from autogpt.config import Config
 from tests.challenges.challenge_decorator.challenge_decorator import challenge
-from tests.challenges.utils import run_interaction_loop
+from tests.challenges.utils import get_workspace_path, run_interaction_loop
 from tests.utils import requires_api_key
 
 CYCLE_COUNT_PER_LEVEL = [1, 1]

@@ -34,7 +34,7 @@ def test_write_file(
     expected_outputs = EXPECTED_OUTPUTS_PER_LEVEL[level_to_run - 1]
 
     for file_name, expected_lines in expected_outputs.items():
-        file_path = str(file_system_agent.workspace.get_path(file_name))
+        file_path = get_workspace_path(file_system_agent, file_name)
         content = read_file(file_path, config)
         for expected_line in expected_lines:
             assert (

@@ -11,8 +11,8 @@
   },
   "debug_code": {
     "debug_code_challenge_a": {
-      "max_level": 1,
-      "max_level_beaten": null
+      "max_level": 2,
+      "max_level_beaten": 1
     }
   },
   "information_retrieval": {

@@ -2,18 +2,12 @@
 from typing import List, Optional
 
 
-def two_sum(nums: List, target: int) -> Optional[int]:
+def two_sum(nums: List, target: int) -> Optional[List[int]]:
     seen = {}
     for i, num in enumerate(nums):
+        typo
         complement = target - num
         if complement in seen:
             return [seen[complement], i]
         seen[num] = i
     return None
-
-
-# Example usage:
-nums = [2, 7, 11, 15]
-target = 9
-result = two_sum(nums, target)
-print(result)  # Output: [0, 1]

@@ -0,0 +1,31 @@
+# mypy: ignore-errors
+from code import two_sum
+from typing import List
+
+
+def test_two_sum(nums: List, target: int, expected_result: List[int]) -> None:
+    result = two_sum(nums, target)
+    print(result)
+    assert (
+        result == expected_result
+    ), f"AssertionError: Expected the output to be {expected_result}"
+
+
+if __name__ == "__main__":
+    # test the trivial case with the first two numbers
+    nums = [2, 7, 11, 15]
+    target = 9
+    expected_result = [0, 1]
+    test_two_sum(nums, target, expected_result)
+
+    # test for ability to use zero and the same number twice
+    nums = [2, 7, 0, 15, 12, 0]
+    target = 0
+    expected_result = [2, 5]
+    test_two_sum(nums, target, expected_result)
+
+    # test for first and last index usage and negative numbers
+    nums = [-6, 7, 11, 4]
+    target = -2
+    expected_result = [0, 3]
+    test_two_sum(nums, target, expected_result)

@@ -1,30 +0,0 @@
-# mypy: ignore-errors
-# we need a new line at the top of the file to avoid a syntax error
-
-
-def test_two_sum(nums, target, expected_result):
-    # These tests are appended to the two_sum file so we can ignore this error for now
-    result = two_sum(nums, target)
-    print(result)
-    assert (
-        result == expected_result
-    ), f"AssertionError: Expected the output to be {expected_result}"
-
-
-# test the trivial case with the first two numbers
-nums = [2, 7, 11, 15]
-target = 9
-expected_result = [0, 1]
-test_two_sum(nums, target, expected_result)
-
-# test for ability to use zero and the same number twice
-nums = [2, 7, 0, 15, 12, 0]
-target = 0
-expected_result = [2, 5]
-test_two_sum(nums, target, expected_result)
-
-# test for first and last index usage and negative numbers
-nums = [-6, 7, 11, 4]
-target = -2
-expected_result = [0, 3]
-test_two_sum(nums, target, expected_result)

@@ -5,20 +5,27 @@ from pytest_mock import MockerFixture
 
 from autogpt.agent import Agent
 from autogpt.commands.execute_code import execute_python_file
-from autogpt.commands.file_operations import append_to_file, write_to_file
 from autogpt.config import Config
 from tests.challenges.challenge_decorator.challenge_decorator import challenge
-from tests.challenges.utils import run_interaction_loop
+from tests.challenges.utils import (
+    copy_file_into_workspace,
+    get_workspace_path,
+    run_interaction_loop,
+)
 from tests.utils import requires_api_key
 
 CYCLE_COUNT = 5
+EXPECTED_VALUES = ["[0, 1]", "[2, 5]", "[0, 3]"]
+DIRECTORY_PATH = Path(__file__).parent / "data"
+CODE_FILE_PATH = "code.py"
+TEST_FILE_PATH = "test.py"
 
 
 @pytest.mark.vcr
 @requires_api_key("OPENAI_API_KEY")
 @challenge
 def test_debug_code_challenge_a(
-    debug_code_agent: Agent,
+    debug_code_agents: Agent,
     monkeypatch: pytest.MonkeyPatch,
     patched_api_requestor: MockerFixture,
     config: Config,

@@ -33,17 +40,20 @@ def test_debug_code_challenge_a(
     :config: The config object for the agent.
     :level_to_run: The level to run.
     """
+    debug_code_agent = debug_code_agents[level_to_run - 1]
 
-    file_path = str(debug_code_agent.workspace.get_path("code.py"))
-
-    code_file_path = Path(__file__).parent / "data" / "two_sum.py"
-    test_file_path = Path(__file__).parent / "data" / "two_sum_tests.py"
-
-    write_to_file(file_path, code_file_path.read_text(), config)
+    copy_file_into_workspace(debug_code_agent, DIRECTORY_PATH, CODE_FILE_PATH)
+    copy_file_into_workspace(debug_code_agent, DIRECTORY_PATH, TEST_FILE_PATH)
 
     run_interaction_loop(monkeypatch, debug_code_agent, CYCLE_COUNT)
 
-    append_to_file(file_path, test_file_path.read_text(), config)
-    output = execute_python_file(file_path, config)
+    output = execute_python_file(
+        get_workspace_path(debug_code_agent, TEST_FILE_PATH), config
+    )
+
     assert "error" not in output.lower(), f"Errors found in output: {output}!"
 
+    for expected_value in EXPECTED_VALUES:
+        assert (
+            expected_value in output
+        ), f"Expected output to contain {expected_value}, but it was not found in {output}!"

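Net effect of the rewritten test: the buggy code.py and a separate test.py are copied into the agent's workspace, the agent runs for CYCLE_COUNT cycles, and verification happens by executing the untouched test.py rather than by appending tests to the very file the agent edits. A self-contained sketch of that verification step (all paths and file contents here are illustrative, not the challenge fixtures):

```python
# Simulate the post-run check: a "fixed" code.py plus a separate test.py in a
# temp workspace, executed the way execute_python_file would run it.
import subprocess
import sys
import tempfile
from pathlib import Path

with tempfile.TemporaryDirectory() as workspace:
    ws = Path(workspace)
    # The "agent's fix": code.py without the stray `typo` line.
    (ws / "code.py").write_text(
        "def two_sum(nums, target):\n"
        "    seen = {}\n"
        "    for i, num in enumerate(nums):\n"
        "        complement = target - num\n"
        "        if complement in seen:\n"
        "            return [seen[complement], i]\n"
        "        seen[num] = i\n"
        "    return None\n"
    )
    (ws / "test.py").write_text(
        "from code import two_sum\n"
        "print(two_sum([2, 7, 11, 15], 9))\n"
    )
    result = subprocess.run(
        [sys.executable, "test.py"], cwd=ws, capture_output=True, text=True
    )
    output = result.stdout + result.stderr
    assert "error" not in output.lower()
    assert "[0, 1]" in output  # same containment check as the test above
```

Because test.py never enters the agent's edit loop, a passing run now proves the fix rather than proving the agent rewrote the assertions.
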
@@ -4,13 +4,15 @@ from pytest_mock import MockerFixture
 from autogpt.commands.file_operations import read_file
 from autogpt.config import Config
 from tests.challenges.challenge_decorator.challenge_decorator import challenge
-from tests.challenges.utils import run_interaction_loop
+from tests.challenges.utils import get_workspace_path, run_interaction_loop
 from tests.utils import requires_api_key
 
 CYCLE_COUNT = 3
 EXPECTED_REVENUES = [["81"], ["81"], ["81", "53", "24", "21", "11", "7", "4", "3", "2"]]
 from autogpt.agent import Agent
 
+OUTPUT_LOCATION = "output.txt"
+
 
 @pytest.mark.vcr
 @requires_api_key("OPENAI_API_KEY")

@@ -31,7 +33,7 @@ def test_information_retrieval_challenge_a(
     information_retrieval_agent = information_retrieval_agents[level_to_run - 1]
     run_interaction_loop(monkeypatch, information_retrieval_agent, CYCLE_COUNT)
 
-    file_path = str(information_retrieval_agent.workspace.get_path("output.txt"))
+    file_path = get_workspace_path(information_retrieval_agent, OUTPUT_LOCATION)
     content = read_file(file_path, config)
     expected_revenues = EXPECTED_REVENUES[level_to_run - 1]
     for revenue in expected_revenues:

@@ -7,10 +7,11 @@ from autogpt.agent import Agent
 from autogpt.commands.file_operations import read_file
 from autogpt.config import Config
 from tests.challenges.challenge_decorator.challenge_decorator import challenge
-from tests.challenges.utils import run_interaction_loop
+from tests.challenges.utils import get_workspace_path, run_interaction_loop
 from tests.utils import requires_api_key
 
 CYCLE_COUNT = 3
+OUTPUT_LOCATION = "2010_nobel_prize_winners.txt"
 
 
 @pytest.mark.vcr

@@ -35,10 +36,8 @@ def test_information_retrieval_challenge_b(
 
     with contextlib.suppress(SystemExit):
         run_interaction_loop(monkeypatch, get_nobel_prize_agent, CYCLE_COUNT)
+    file_path = get_workspace_path(get_nobel_prize_agent, OUTPUT_LOCATION)
 
-    file_path = str(
-        get_nobel_prize_agent.workspace.get_path("2010_nobel_prize_winners.txt")
-    )
     content = read_file(file_path, config)
     assert "Andre Geim" in content, "Expected the file to contain Andre Geim"
     assert (

@@ -6,10 +6,11 @@ from autogpt.agent import Agent
 from autogpt.commands.file_operations import read_file
 from autogpt.config import Config
 from tests.challenges.challenge_decorator.challenge_decorator import challenge
-from tests.challenges.utils import run_interaction_loop
+from tests.challenges.utils import get_workspace_path, run_interaction_loop
 from tests.utils import requires_api_key
 
 CYCLE_COUNT = 3
+OUTPUT_LOCATION = "kube.yaml"
 
 
 @pytest.mark.vcr

@@ -34,7 +35,7 @@ def test_kubernetes_template_challenge_a(
     """
     run_interaction_loop(monkeypatch, kubernetes_agent, CYCLE_COUNT)
 
-    file_path = str(kubernetes_agent.workspace.get_path("kube.yaml"))
+    file_path = get_workspace_path(kubernetes_agent, OUTPUT_LOCATION)
     content = read_file(file_path, config)
 
     for word in ["apiVersion", "kind", "metadata", "spec"]:

@@ -5,9 +5,11 @@ from autogpt.agent import Agent
 from autogpt.commands.file_operations import read_file, write_to_file
 from autogpt.config import Config
 from tests.challenges.challenge_decorator.challenge_decorator import challenge
-from tests.challenges.utils import run_interaction_loop
+from tests.challenges.utils import get_workspace_path, run_interaction_loop
 from tests.utils import requires_api_key
 
+OUTPUT_LOCATION = "output.txt"
+
 
 @pytest.mark.vcr
 @requires_api_key("OPENAI_API_KEY")

@@ -35,7 +37,7 @@ def test_memory_challenge_a(
 
     run_interaction_loop(monkeypatch, memory_management_agent, level_to_run + 2)
 
-    file_path = str(memory_management_agent.workspace.get_path("output.txt"))
+    file_path = get_workspace_path(memory_management_agent, OUTPUT_LOCATION)
     content = read_file(file_path, config)
     assert task_id in content, f"Expected the file to contain {task_id}"
 

@@ -58,7 +60,7 @@ def create_instructions_files(
     for i in range(1, num_files + 1):
         content = generate_content(i, task_id, base_filename, num_files)
         file_name = f"{base_filename}{i}.txt"
-        file_path = str(memory_management_agent.workspace.get_path(file_name))
+        file_path = get_workspace_path(memory_management_agent, file_name)
         write_to_file(file_path, content, config)
 
 

@@ -5,10 +5,15 @@ from autogpt.agent import Agent
 from autogpt.commands.file_operations import read_file, write_to_file
 from autogpt.config import Config
 from tests.challenges.challenge_decorator.challenge_decorator import challenge
-from tests.challenges.utils import generate_noise, run_interaction_loop
+from tests.challenges.utils import (
+    generate_noise,
+    get_workspace_path,
+    run_interaction_loop,
+)
 from tests.utils import requires_api_key
 
 NOISE = 1000
+OUTPUT_LOCATION = "output.txt"
 
 
 @pytest.mark.vcr

@@ -36,7 +41,7 @@ def test_memory_challenge_b(
 
     run_interaction_loop(monkeypatch, memory_management_agent, level_to_run + 2)
 
-    file_path = str(memory_management_agent.workspace.get_path("output.txt"))
+    file_path = get_workspace_path(memory_management_agent, OUTPUT_LOCATION)
     content = read_file(file_path, config)
     for task_id in task_ids:
         assert task_id in content, f"Expected the file to contain {task_id}"

@@ -61,7 +66,8 @@ def create_instructions_files(
     for i in range(1, level + 1):
         content = generate_content(i, task_ids, base_filename, level)
         file_name = f"{base_filename}{i}.txt"
-        file_path = str(memory_management_agent.workspace.get_path(file_name))
+        file_path = get_workspace_path(memory_management_agent, file_name)
+
         write_to_file(file_path, content, config)
 
 

@@ -5,10 +5,15 @@ from autogpt.agent import Agent
 from autogpt.commands.file_operations import read_file, write_to_file
 from autogpt.config import Config
 from tests.challenges.challenge_decorator.challenge_decorator import challenge
-from tests.challenges.utils import generate_noise, run_interaction_loop
+from tests.challenges.utils import (
+    generate_noise,
+    get_workspace_path,
+    run_interaction_loop,
+)
 from tests.utils import requires_api_key
 
 NOISE = 1000
+OUTPUT_LOCATION = "output.txt"
 
 
 # @pytest.mark.vcr

@@ -53,8 +58,7 @@ def test_memory_challenge_c(
     )
 
     run_interaction_loop(monkeypatch, memory_management_agent, level_to_run + 2)
-
-    file_path = str(memory_management_agent.workspace.get_path("output.txt"))
+    file_path = get_workspace_path(memory_management_agent, OUTPUT_LOCATION)
     content = read_file(file_path, config)
     for phrase in level_silly_phrases:
         assert phrase in content, f"Expected the file to contain {phrase}"

@@ -79,7 +83,7 @@ def create_instructions_files(
     for i in range(1, level + 1):
         content = generate_content(i, task_ids, base_filename, level)
         file_name = f"{base_filename}{i}.txt"
-        file_path = str(memory_management_agent.workspace.get_path(file_name))
+        file_path = get_workspace_path(memory_management_agent, file_name)
         write_to_file(file_path, content, config)
 
 

@@ -1,5 +1,7 @@
 import contextlib
 import random
+import shutil
+from pathlib import Path
 from typing import Generator
 
 import pytest

@@ -42,3 +44,15 @@ def run_interaction_loop(
     setup_mock_input(monkeypatch, cycle_count)
     with contextlib.suppress(SystemExit):
         agent.start_interaction_loop()
+
+
+def get_workspace_path(agent: Agent, file_name: str) -> str:
+    return str(agent.workspace.get_path(file_name))
+
+
+def copy_file_into_workspace(
+    agent: Agent, directory_path: Path, file_path: str
+) -> None:
+    workspace_code_file_path = get_workspace_path(agent, file_path)
+    code_file_path = directory_path / file_path
+    shutil.copy(code_file_path, workspace_code_file_path)

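These two helpers centralize the `str(agent.workspace.get_path(...))` pattern that the hunks above replace throughout the challenge tests. A usage sketch with minimal stand-ins for the Agent/Workspace types (the real classes live in autogpt; the stubs are illustrative only):

```python
# Stand-ins mimicking just the attribute shape the helpers rely on:
# agent.workspace.get_path(name) -> Path under the workspace root.
import shutil
import tempfile
from pathlib import Path

class FakeWorkspace:
    def __init__(self, root: Path) -> None:
        self.root = root

    def get_path(self, name: str) -> Path:
        return self.root / name

class FakeAgent:
    def __init__(self, root: Path) -> None:
        self.workspace = FakeWorkspace(root)

def get_workspace_path(agent, file_name: str) -> str:
    return str(agent.workspace.get_path(file_name))

def copy_file_into_workspace(agent, directory_path: Path, file_path: str) -> None:
    shutil.copy(directory_path / file_path, get_workspace_path(agent, file_path))

with tempfile.TemporaryDirectory() as src, tempfile.TemporaryDirectory() as ws:
    (Path(src) / "code.py").write_text("print('hi')\n")
    agent = FakeAgent(Path(ws))
    copy_file_into_workspace(agent, Path(src), "code.py")
    assert Path(get_workspace_path(agent, "code.py")).exists()
```
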
@@ -240,41 +240,47 @@ def get_nobel_prize_agent(agent_test_config, memory_json_file, workspace: Workspace):
 
 
 @pytest.fixture
-def debug_code_agent(agent_test_config, memory_json_file, workspace: Workspace):
-    command_registry = CommandRegistry()
-    command_registry.import_commands("autogpt.commands.file_operations")
-    command_registry.import_commands("autogpt.commands.execute_code")
-    command_registry.import_commands("autogpt.commands.improve_code")
-    command_registry.import_commands("autogpt.app")
-    command_registry.import_commands("autogpt.commands.task_statuses")
-
-    ai_config = AIConfig(
-        ai_name="Debug Code Agent",
-        ai_role="an autonomous agent that specializes in debugging python code",
-        ai_goals=[
-            "1-Run the code in the file named 'code.py' using the execute_code command.",
-            "2-Read code.py to understand why the code is not working as expected.",
-            "3-Modify code.py to fix the error.",
-            "Repeat step 1, 2 and 3 until the code is working as expected. When you're done use the task_complete command.",
-            "Do not use any other commands than execute_python_file and write_file",
+def debug_code_agents(agent_test_config, memory_json_file, workspace: Workspace):
+    agents = []
+    goals = [
+        [
+            "1- Run test.py using the execute_python_file command.",
+            "2- Read code.py using the read_file command.",
+            "3- Modify code.py using the write_to_file command."
+            "Repeat step 1, 2 and 3 until test.py runs without errors.",
         ],
-    )
-    ai_config.command_registry = command_registry
+        [
+            "1- Run test.py.",
+            "2- Read code.py.",
+            "3- Modify code.py."
+            "Repeat step 1, 2 and 3 until test.py runs without errors.",
+        ],
+        ["1- Make test.py run without errors."],
+    ]
 
-    system_prompt = ai_config.construct_full_prompt()
-    Config().set_continuous_mode(False)
-    agent = Agent(
-        ai_name="Debug Code Agent",
-        memory=memory_json_file,
-        command_registry=command_registry,
-        config=ai_config,
-        next_action_count=0,
-        system_prompt=system_prompt,
-        triggering_prompt=DEFAULT_TRIGGERING_PROMPT,
-        workspace_directory=workspace.root,
-    )
-
-    return agent
+    for goal in goals:
+        ai_config = AIConfig(
+            ai_name="Debug Code Agent",
+            ai_role="an autonomous agent that specializes in debugging python code",
+            ai_goals=goal,
+        )
+        command_registry = get_command_registry(agent_test_config)
+        ai_config.command_registry = command_registry
+        system_prompt = ai_config.construct_full_prompt()
+        Config().set_continuous_mode(False)
+        agents.append(
+            Agent(
+                ai_name="Debug Code Agent",
+                memory=memory_json_file,
+                command_registry=command_registry,
+                config=ai_config,
+                next_action_count=0,
+                system_prompt=system_prompt,
+                triggering_prompt=DEFAULT_TRIGGERING_PROMPT,
+                workspace_directory=workspace.root,
+            )
+        )
+    return agents
+
+
+def get_command_registry(agent_test_config):

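The fixture rewrite above is the heart of the commit: instead of one debug_code_agent with a single fixed goal list, conftest now builds one agent per difficulty level, with goals that get less prescriptive as the level rises (the first names the exact commands, the last states only the desired outcome). A small, illustrative sketch of how a challenge test consumes such a fixture (placeholder strings, not the real prompts):

```python
# Level-indexed fixture consumption: levels are 1-indexed, so the test picks
# agents[level_to_run - 1], as in debug_code_agents[level_to_run - 1] above.
from typing import List

def agent_for_level(agents: List, level_to_run: int):
    assert 1 <= level_to_run <= len(agents), "levels are 1-indexed"
    return agents[level_to_run - 1]

agents = [
    "agent with step-by-step, command-level goals",   # level 1
    "agent with terse file-level goals",              # level 2
    "agent told only to make test.py pass",           # level 3
]
print(agent_for_level(agents, 1))
print(agent_for_level(agents, 3))
```
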