AutoGPT/benchmark/agbenchmark/agent_interface.py

import os
import platform
import queue
import select
import shutil
import subprocess
import sys
import time
from threading import Thread
from typing import Any, List

import psutil
from dotenv import load_dotenv

import agbenchmark.start_benchmark

load_dotenv()

# Resolve the HELICONE_GRAPHQL_LOGS switch once at import time: it is True only
# when the environment variable is set to "true" (compared case-insensitively);
# an unset or empty variable yields False.
helicone_graphql_logs = os.getenv("HELICONE_GRAPHQL_LOGS")
if helicone_graphql_logs:
    HELICONE_GRAPHQL_LOGS = helicone_graphql_logs.lower() == "true"
else:
    HELICONE_GRAPHQL_LOGS = False


def run_linux_env(process: Any, start_time: float, timeout: float) -> None:
    """Echo a child process's stdout until it exits or the timeout elapses.

    Args:
        process: Object exposing ``stdout``, ``poll()`` and ``pid`` the way
            ``subprocess.Popen`` does.
        start_time: ``time.time()`` value taken when the process was started.
        timeout: Maximum number of seconds the process is allowed to run.

    If the timeout is exceeded, every descendant of the process and then the
    process itself are killed through psutil.
    """
    poll_interval = 0.1  # seconds; waiting here avoids a 100% CPU spin
    can_read = process.stdout is not None
    timed_out = False

    while True:
        if can_read:
            try:
                # Wait briefly for data instead of polling with a zero timeout.
                ready, _, _ = select.select([process.stdout], [], [], poll_interval)
                if ready:
                    output = process.stdout.readline()
                    if output:
                        print(output.strip())
                    else:
                        # An empty read means EOF: nothing more will arrive.
                        can_read = False
            except UnicodeDecodeError as e:
                # A single undecodable line should not end the monitoring.
                print(f"Skipped undecodable process output: {e}")
            except (OSError, ValueError, TypeError) as e:
                # The stream is closed or cannot be selected on. Stop reading,
                # but keep checking for exit/timeout below so we never hang.
                print(f"Stopped reading process output: {e}")
                can_read = False

        # The exit and timeout checks run on every iteration, even after a
        # read error, so the loop is always bounded by `timeout`.
        if process.poll() is not None:
            break
        if time.time() - start_time > timeout:
            timed_out = True
            break

        if not can_read:
            time.sleep(poll_interval)

    # Decide from the loop's own exit reason rather than re-reading the clock:
    # a process that finished on its own must not be reported (or killed by
    # PID) as timed out.
    if not timed_out:
        print("The Python function has finished running.")
        return

    print("The Python function has exceeded the time limit and was terminated.")
    try:
        parent = psutil.Process(process.pid)
        # Children are killed before the parent, as before.
        targets = parent.children(recursive=True) + [parent]
    except psutil.NoSuchProcess:
        # The process disappeared between the timeout check and the kill.
        return
    for proc in targets:
        try:
            proc.kill()
        except psutil.NoSuchProcess:
            pass


def enqueue_output(out: Any, my_queue: Any) -> None:
    """Put every line read from ``out`` onto ``my_queue``, then close ``out``.

    Args:
        out: Readable stream exposing ``readline()`` and ``close()``; it may
            yield either ``str`` or ``bytes`` lines.
        my_queue: Queue-like object whose ``put()`` receives each line.

    Reading stops at the first empty read (EOF). Testing truthiness instead of
    comparing against ``b""`` makes this work for text-mode streams too, where
    EOF is ``""`` and would otherwise never match the sentinel.
    """
    try:
        while line := out.readline():
            my_queue.put(line)
    finally:
        # Close the stream even if reading or enqueueing raised.
        out.close()


def run_windows_env(process: Any, start_time: float, timeout: float) -> None:
    """Echo a child process's stdout until it exits or the timeout elapses.

    A daemon thread running ``enqueue_output`` reads ``process.stdout`` into a
    queue, and this function prints the queued lines.

    Args:
        process: Object exposing ``stdout``, ``poll()`` and ``terminate()`` the
            way ``subprocess.Popen`` does.
        start_time: ``time.time()`` value taken when the process was started.
        timeout: Maximum number of seconds the process is allowed to run.

    If the timeout is exceeded the process is terminated.
    """
    poll_interval = 0.1  # seconds; blocking on the queue avoids a busy spin
    my_queue: Any = queue.Queue()
    thread = Thread(target=enqueue_output, args=(process.stdout, my_queue))
    thread.daemon = True
    thread.start()

    timed_out = False
    while True:
        try:
            # Wait briefly for a line rather than spinning on get_nowait().
            output = my_queue.get(timeout=poll_interval).strip()
            print(output)
        except queue.Empty:
            pass

        if process.poll() is not None:
            break
        if time.time() - start_time > timeout:
            timed_out = True
            break

    # Use the loop's own exit reason rather than re-reading the clock, so a
    # process that exited on its own is never reported as timed out.
    if timed_out:
        print("The Python function has exceeded the time limit and was terminated.")
        process.terminate()


def run_agent(task: str, timeout: int) -> None:
    """Run the benchmark entry module in a subprocess and stream its output.

    The module ``agbenchmark.benchmarks`` is started with the current Python
    interpreter, with ``task`` as its only argument and
    ``agbenchmark.start_benchmark.HOME_DIRECTORY`` as its working directory.
    Its stdout and stderr are merged and echoed by the platform-specific
    monitor, which also enforces ``timeout``.

    Args:
        task: Task text passed to the entry module on the command line.
        timeout: Maximum number of seconds the subprocess may run.
    """
    entry_path = "agbenchmark.benchmarks"

    print(f"Running '{entry_path}' with timeout {timeout}")

    command = [sys.executable, "-m", entry_path, str(task)]
    process = subprocess.Popen(
        command,
        stdout=subprocess.PIPE,
        stderr=subprocess.STDOUT,
        universal_newlines=True,
        cwd=agbenchmark.start_benchmark.HOME_DIRECTORY,
        bufsize=1,
    )

    start_time = time.time()

    if platform.system() == "Windows":
        run_windows_env(process, start_time, timeout)
    else:
        run_linux_env(process, start_time, timeout)

    # Sample the deadline as soon as the monitor returns. The monitors return
    # nothing, so this is the only way to tell a timeout from a plain failure.
    timed_out = time.time() - start_time > timeout

    process.wait()

    if process.returncode != 0:
        if timed_out:
            print("The agent timed out")
        else:
            # A non-zero exit inside the time limit is a failure, not a timeout.
            print(f"The agent exited with return code {process.returncode}")


def get_list_of_file_paths(
    challenge_dir_path: str, artifact_folder_name: str
) -> List[str]:
    """List the entries of a challenge's artifact folder as joined paths.

    The folder is resolved as
    ``CURRENT_DIRECTORY/../<challenge_dir_path>/<artifact_folder_name>``, where
    ``CURRENT_DIRECTORY`` comes from ``agbenchmark.start_benchmark``.

    Args:
        challenge_dir_path: Challenge directory, joined onto the parent of
            ``CURRENT_DIRECTORY``.
        artifact_folder_name: Name of the artifact folder inside the challenge.

    Returns:
        One path per entry reported by ``os.listdir`` for the folder, or an
        empty list when the folder does not exist.
    """
    # this file is at agbenchmark\agent_interface.py
    base_dir = agbenchmark.start_benchmark.CURRENT_DIRECTORY
    artifact_dir = os.path.join(
        base_dir, "..", challenge_dir_path, artifact_folder_name
    )

    if os.path.exists(artifact_dir):
        entry_paths: List[str] = []
        for entry_name in os.listdir(artifact_dir):
            entry_paths.append(os.path.join(artifact_dir, entry_name))
        return entry_paths

    return []


def copy_artifacts_into_workspace(
    workspace: str | dict[str, str], artifact_folder_name: str, challenge_dir_path: str
) -> None:
    """Copy the regular files of a challenge's artifact folder into a workspace.

    Args:
        workspace: Destination directory, or a dict of directories. For a dict,
            the ``"input"`` entry is used when ``artifact_folder_name`` is
            ``"artifacts_in"`` and the ``"output"`` entry otherwise.
        artifact_folder_name: Name of the artifact folder to copy from.
        challenge_dir_path: Challenge directory that holds the artifact folder.

    Entries that are not regular files (such as sub-directories) are skipped.
    """
    if isinstance(workspace, dict):
        key = "input" if artifact_folder_name == "artifacts_in" else "output"
        workspace = workspace[key]

    candidates = get_list_of_file_paths(challenge_dir_path, artifact_folder_name)
    # filter() is lazy, so each path is checked right before it is copied.
    for artifact_path in filter(os.path.isfile, candidates):
        shutil.copy(artifact_path, workspace)
Integrate one challenge to auto gpt (#44) 2023-07-02 14:38:30 +00:00			`import os`
adding backend and a basic ui (#309) 2023-08-27 07:18:30 +00:00			`import platform`
			`import queue`
Fix timeout not working (#218) 2023-07-31 02:05:09 +00:00			`import select`
Add 'Debug simple typo with guidance' challenge (#65) Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com> 2023-07-07 20:50:53 +00:00			`import shutil`
Integrate one challenge to auto gpt (#44) 2023-07-02 14:38:30 +00:00			`import subprocess`
Add static linters ci (#45) 2023-07-02 20:14:49 +00:00			`import sys`
Integrate one challenge to auto gpt (#44) 2023-07-02 14:38:30 +00:00			`import time`
adding backend and a basic ui (#309) 2023-08-27 07:18:30 +00:00			`from threading import Thread`
			`from typing import Any, List`
Add static linters ci (#45) 2023-07-02 20:14:49 +00:00
Kill all subprocesses (#265) Co-authored-by: merwanehamadi <merwanehamadi@gmail.com> 2023-08-07 04:12:10 +00:00			`import psutil`
moving run agent to tests & agnostic run working 2023-06-30 14:50:54 +00:00			`from dotenv import load_dotenv`

adding backend and a basic ui (#309) 2023-08-27 07:18:30 +00:00			`import agbenchmark.start_benchmark`
Fix tests ci (#82) 2023-07-11 04:54:25 +00:00
moving run agent to tests & agnostic run working 2023-06-30 14:50:54 +00:00			`load_dotenv()`

Remove graphql logs (#264) Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com> 2023-08-06 19:22:49 +00:00			`helicone_graphql_logs = os.getenv("HELICONE_GRAPHQL_LOGS")`
			`HELICONE_GRAPHQL_LOGS = (`
			`helicone_graphql_logs.lower() == "true" if helicone_graphql_logs else False`
			`)`
moving run agent to tests & agnostic run working 2023-06-30 14:50:54 +00:00

adding backend and a basic ui (#309) 2023-08-27 07:18:30 +00:00			`def run_linux_env(process: Any, start_time: float, timeout: float) -> None:`
Add agent protocol interface test (#259) Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com> 2023-08-06 01:00:05 +00:00			`while True:`
			`try:`
			`# This checks if there's data to be read from stdout without blocking.`
			`if process.stdout and select.select([process.stdout], [], [], 0)[0]:`
			`output = process.stdout.readline()`
			`print(output.strip())`
			`except Exception as e:`
			`continue`
moving run agent to tests & agnostic run working 2023-06-30 14:50:54 +00:00
Add agent protocol interface test (#259) Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com> 2023-08-06 01:00:05 +00:00			`# Check if process has ended, has no more output, or exceeded timeout`
			`if process.poll() is not None or (time.time() - start_time > timeout):`
			`break`
moving run agent to tests & agnostic run working 2023-06-30 14:50:54 +00:00
Add agent protocol interface test (#259) Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com> 2023-08-06 01:00:05 +00:00			`if time.time() - start_time > timeout:`
			`print("The Python function has exceeded the time limit and was terminated.")`
Kill all subprocesses (#265) Co-authored-by: merwanehamadi <merwanehamadi@gmail.com> 2023-08-07 04:12:10 +00:00			`parent = psutil.Process(process.pid)`
			`for child in parent.children(recursive=True):`
			`child.kill()`
			`parent.kill()`

Add agent protocol interface test (#259) Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com> 2023-08-06 01:00:05 +00:00			`else:`
			`print("The Python function has finished running.")`
Integrate one challenge to auto gpt (#44) 2023-07-02 14:38:30 +00:00
adding backend and a basic ui (#309) 2023-08-27 07:18:30 +00:00
			`def enqueue_output(out: Any, my_queue: Any) -> None:`
			`for line in iter(out.readline, b""):`
			`my_queue.put(line)`
			`out.close()`


			`def run_windows_env(process: Any, start_time: float, timeout: float) -> None:`
			`my_queue: Any = queue.Queue()`
			`thread = Thread(target=enqueue_output, args=(process.stdout, my_queue))`
			`thread.daemon = True`
			`thread.start()`

			`while True:`
			`try:`
			`output = my_queue.get_nowait().strip()`
			`print(output)`
			`except queue.Empty:`
			`pass`

			`if process.poll() is not None or (time.time() - start_time > timeout):`
			`break`

			`if time.time() - start_time > timeout:`
			`print("The Python function has exceeded the time limit and was terminated.")`
			`process.terminate()`


			`def run_agent(task: str, timeout: int) -> None:`
			`"""Calling to get a response"""`

			`entry_path = "agbenchmark.benchmarks"`

			`print(f"Running '{entry_path}' with timeout {timeout}")`

			`command = [sys.executable, "-m", entry_path, str(task)]`
			`process = subprocess.Popen(`
			`command,`
			`stdout=subprocess.PIPE,`
			`stderr=subprocess.STDOUT,`
			`universal_newlines=True,`
			`cwd=agbenchmark.start_benchmark.HOME_DIRECTORY,`
			`bufsize=1,`
			`)`

			`start_time = time.time()`

			`if platform.system() == "Windows":`
			`run_windows_env(process, start_time, timeout)`
			`else:`
			`run_linux_env(process, start_time, timeout)`

Add agent protocol interface test (#259) Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com> 2023-08-06 01:00:05 +00:00			`process.wait()`
Integrate one challenge to auto gpt (#44) 2023-07-02 14:38:30 +00:00
Add agent protocol interface test (#259) Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com> 2023-08-06 01:00:05 +00:00			`if process.returncode != 0:`
			`print(f"The agent timed out")`
Fix Auto-GPT looping forever (#87) 2023-07-12 00:02:29 +00:00
moving run agent to tests & agnostic run working 2023-06-30 14:50:54 +00:00
Use agent protocol (#278) Signed-off-by: Jakub Novak <jakub@e2b.dev> 2023-08-11 07:04:08 +00:00			`def get_list_of_file_paths(`
			`challenge_dir_path: str, artifact_folder_name: str`
			`) -> List[str]:`
Added --test, consolidate files, reports working (#83) 2023-07-11 02:25:19 +00:00			`# this file is at agbenchmark\agent_interface.py`
Fix tests ci (#82) 2023-07-11 04:54:25 +00:00			`source_dir = os.path.join(`
adding backend and a basic ui (#309) 2023-08-27 07:18:30 +00:00			`agbenchmark.start_benchmark.CURRENT_DIRECTORY,`
			`"..",`
			`challenge_dir_path,`
			`artifact_folder_name,`
Fix tests ci (#82) 2023-07-11 04:54:25 +00:00			`)`
Add 'Debug simple typo with guidance' challenge (#65) Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com> 2023-07-07 20:50:53 +00:00			`if not os.path.exists(source_dir):`
Use agent protocol (#278) Signed-off-by: Jakub Novak <jakub@e2b.dev> 2023-08-11 07:04:08 +00:00			`return []`
			`return [os.path.join(source_dir, file_name) for file_name in os.listdir(source_dir)]`

Add 'Debug simple typo with guidance' challenge (#65) Signed-off-by: Merwane Hamadi <merwanehamadi@gmail.com> 2023-07-07 20:50:53 +00:00
Use agent protocol (#278) Signed-off-by: Jakub Novak <jakub@e2b.dev> 2023-08-11 07:04:08 +00:00			`def copy_artifacts_into_workspace(`
mock flag, workspace io fixes, mark fixes 2023-08-11 12:22:21 +00:00			`workspace: str \| dict[str, str], artifact_folder_name: str, challenge_dir_path: str`
Use agent protocol (#278) Signed-off-by: Jakub Novak <jakub@e2b.dev> 2023-08-11 07:04:08 +00:00			`) -> None:`
mock flag, workspace io fixes, mark fixes 2023-08-11 12:22:21 +00:00			`if isinstance(workspace, dict):`
			`if artifact_folder_name == "artifacts_in":`
			`workspace = workspace["input"]`
			`else:`
			`workspace = workspace["output"]`
Use agent protocol (#278) Signed-off-by: Jakub Novak <jakub@e2b.dev> 2023-08-11 07:04:08 +00:00			`file_paths = get_list_of_file_paths(challenge_dir_path, artifact_folder_name)`
			`for file_path in file_paths:`
			`if os.path.isfile(file_path):`
			`shutil.copy(file_path, workspace)`