# AutoGPT/agbenchmark/start_benchmark.py — CLI entry point for running benchmark tests.
import json
import os
import sys
from pathlib import Path
from typing import Any
import click
import pytest
from dotenv import load_dotenv
# Pull environment variables (e.g. API keys) from a local .env file.
load_dotenv()

# Directory containing this file — used later as the pytest target when
# agbenchmark is invoked as a library.
CURRENT_DIRECTORY = Path(__file__).resolve().parent

# Both config files live in the caller's working directory, not next to this file.
_CWD = Path.cwd()
CONFIG_PATH = str(_CWD / "config.json")
REGRESSION_TESTS_PATH = str(_CWD / "regression_tests.json")
2023-07-02 20:14:49 +00:00
@click.group()
def cli() -> None:
    """Root command group for the agbenchmark CLI; subcommands attach via @cli.command()."""
@cli.command()
@click.option("--category", default=None, help="Specific category to run")
@click.option("--maintain", is_flag=True, help="Runs only regression tests")
@click.option("--improve", is_flag=True, help="Run only non-regression tests")
@click.option("--mock", is_flag=True, help="Run with mock")
def start(category: str, maintain: bool, improve: bool, mock: bool) -> int:
    """Start the benchmark tests. If a category flag is provided, run the categories with that mark."""
    if maintain and improve:
        print(
            "Error: You can't use both --maintain and --improve at the same time. Please choose one."
        )
        # BUG FIX: the original `return 1` was discarded by click's command
        # dispatch, so the process still exited with status 0 on this error.
        sys.exit(1)

    config = _load_or_create_config()

    # The test suite reads this env var to decide whether to run mocked.
    os.environ["MOCK_TEST"] = "True" if mock else "False"

    # Ensure the regression-tests file exists so later reads don't fail.
    if not os.path.exists(REGRESSION_TESTS_PATH):
        with open(REGRESSION_TESTS_PATH, "a"):
            pass

    print("Current configuration:")
    for key, value in config.items():
        print(f"{key}: {value}")

    # Translate CLI flags into pytest arguments (custom flags are handled by
    # the agbenchmark pytest plugin).
    pytest_args = ["-vs"]
    if category:
        pytest_args.extend(["-m", category])
        print("Starting benchmark tests ", category)
    else:
        print("Running all categories")

    if maintain:
        print("Running only regression tests")
        pytest_args.append("--maintain")
    elif improve:
        print("Running only non-regression tests")
        pytest_args.append("--improve")

    if mock:
        pytest_args.append("--mock")

    # when used as a library, the pytest directory to execute is in the CURRENT_DIRECTORY
    pytest_args.append(str(CURRENT_DIRECTORY))

    # BUG FIX: was `return sys.exit(...)` — sys.exit never returns, so the
    # `return` was dead code. Exit with pytest's status code directly.
    sys.exit(pytest.main(pytest_args))


def _load_or_create_config() -> dict:
    """Load config.json from the working directory.

    If the file is missing or empty, interactively prompt for the settings,
    persist them to CONFIG_PATH, and return them.
    """
    if not os.path.exists(CONFIG_PATH) or os.stat(CONFIG_PATH).st_size == 0:
        config = {
            "workspace": click.prompt(
                "Please enter a new workspace path",
                default=os.path.join(Path.home(), "workspace"),
            ),
            # Typo fixed in the prompt text: "a the path" -> "the path".
            "entry_path": click.prompt(
                "Please enter the path to your run_specific_agent function implementation",
                default="/benchmarks.py",
            ),
            "cutoff": click.prompt(
                "Please enter a hard cutoff runtime for your agent",
                default="60",
            ),
        }
        with open(CONFIG_PATH, "w") as f:
            json.dump(config, f)
        return config

    # File exists and is non-empty: load it.
    with open(CONFIG_PATH, "r") as f:
        return json.load(f)
2023-07-02 20:14:49 +00:00
def get_regression_data() -> Any:
    """Read and return the parsed contents of the regression-tests JSON file."""
    return json.loads(Path(REGRESSION_TESTS_PATH).read_text())
2023-07-02 20:14:49 +00:00
if __name__ == "__main__":
    # Script entry point: run the `start` command directly (bypasses the
    # `cli` group, so only `start`'s own options are parsed).
    start()