# AutoGPT/autogpt/llm_utils.py
from __future__ import annotations

import time
from typing import List, Optional

import openai
from colorama import Fore, Style
from openai.error import APIError, RateLimitError

from autogpt.config import Config
from autogpt.logs import logger
from autogpt.types.openai import Message

CFG = Config()
openai.api_key = CFG.openai_api_key
def call_ai_function(
    function: str, args: list, description: str, model: str | None = None
) -> str:
    """Call an AI function

    This is a magic function that can do anything with no-code. See
    https://github.com/Torantulino/AI-Functions for more info.

    Args:
        function (str): The function to call
        args (list): The arguments to pass to the function
        description (str): The description of the function
        model (str, optional): The model to use. Defaults to None, in which
            case CFG.smart_llm_model is used.

    Returns:
        str: The response from the function
    """
    if model is None:
        model = CFG.smart_llm_model
    # Stringify every argument, rendering None explicitly as "None" so the
    # model sees it rather than an empty slot.
    arg_strings = [str(arg) if arg is not None else "None" for arg in args]
    # The model receives all arguments as one comma-separated string.
    joined_args: str = ", ".join(arg_strings)
    messages: List[Message] = [
        {
            "role": "system",
            "content": f"You are now the following python function: ```# {description}"
            f"\n{function}```\n\nOnly respond with your `return` value.",
        },
        {"role": "user", "content": joined_args},
    ]
    # Temperature 0 keeps the simulated function as deterministic as possible.
    return create_chat_completion(model=model, messages=messages, temperature=0)
# Overly simple abstraction until we create something better:
# a simple retry mechanism for rate-limit errors and 502 Bad Gateway responses.
2023-04-14 19:42:28 +00:00
def create_chat_completion(
    messages: List[Message],  # type: ignore
    model: Optional[str] = None,
    temperature: float = CFG.temperature,
    max_tokens: Optional[int] = None,
) -> str:
    """Create a chat completion using the OpenAI API

    Args:
        messages (List[Message]): The messages to send to the chat completion
        model (str, optional): The model to use. Defaults to None.
        temperature (float, optional): The temperature to use. Defaults to
            CFG.temperature (captured once, at module import time).
        max_tokens (int, optional): The max tokens to use. Defaults to None.

    Returns:
        str: The response from the chat completion
    """
    num_retries = 10
    # Ensures the "PAID account" warning is printed at most once per call.
    warned_user = False
    if CFG.debug_mode:
        print(
            f"{Fore.GREEN}Creating chat completion with model {model}, temperature {temperature}, max_tokens {max_tokens}{Fore.RESET}"
        )
    # Give each registered plugin a chance to service the request itself;
    # the first plugin that returns a non-None message short-circuits the
    # OpenAI call entirely.
    for plugin in CFG.plugins:
        if plugin.can_handle_chat_completion(
            messages=messages,
            model=model,
            temperature=temperature,
            max_tokens=max_tokens,
        ):
            message = plugin.handle_chat_completion(
                messages=messages,
                model=model,
                temperature=temperature,
                max_tokens=max_tokens,
            )
            if message is not None:
                return message
    response = None
    for attempt in range(num_retries):
        # Exponential backoff: 4, 8, 16, ... seconds per failed attempt.
        backoff = 2 ** (attempt + 2)
        try:
            if CFG.use_azure:
                # Azure OpenAI addresses the model through a deployment id
                # in addition to the model name.
                response = openai.ChatCompletion.create(
                    deployment_id=CFG.get_azure_deployment_id_for_model(model),
                    model=model,
                    messages=messages,
                    temperature=temperature,
                    max_tokens=max_tokens,
                )
            else:
                response = openai.ChatCompletion.create(
                    model=model,
                    messages=messages,
                    temperature=temperature,
                    max_tokens=max_tokens,
                )
            break
        except RateLimitError:
            if CFG.debug_mode:
                print(
                    f"{Fore.RED}Error: ", f"Reached rate limit, passing...{Fore.RESET}"
                )
            if not warned_user:
                logger.double_check(
                    f"Please double check that you have setup a {Fore.CYAN + Style.BRIGHT}PAID{Style.RESET_ALL} OpenAI API Account. "
                    + f"You can read more here: {Fore.CYAN}https://github.com/Significant-Gravitas/Auto-GPT#openai-api-keys-configuration{Fore.RESET}"
                )
                warned_user = True
        except APIError as e:
            # Only 502 Bad Gateway is considered transient and retried;
            # any other API error (or a 502 on the final attempt) propagates.
            if e.http_status != 502:
                raise
            if attempt == num_retries - 1:
                raise
            if CFG.debug_mode:
                print(
                    f"{Fore.RED}Error: ",
                    f"API Bad gateway. Waiting {backoff} seconds...{Fore.RESET}",
                )
        # Shared backoff for both retryable failure paths above.
        time.sleep(backoff)
    if response is None:
        # Every attempt was rate-limited; report and bail out. In debug mode
        # raise so the stack trace is visible, otherwise exit the process.
        logger.typewriter_log(
            "FAILED TO GET RESPONSE FROM OPENAI",
            Fore.RED,
            "Auto-GPT has failed to get a response from OpenAI's services. "
            + f"Try running Auto-GPT again, and if the problem the persists try running it with `{Fore.CYAN}--debug{Fore.RESET}`.",
        )
        logger.double_check()
        if CFG.debug_mode:
            raise RuntimeError(f"Failed to get response after {num_retries} retries")
        else:
            quit(1)
    resp = response.choices[0].message["content"]
    # Let plugins post-process the raw completion text, in registration order.
    for plugin in CFG.plugins:
        if not plugin.can_handle_on_response():
            continue
        resp = plugin.on_response(resp)
    return resp
def create_embedding_with_ada(text) -> list:
    """Create an embedding with text-ada-002 using the OpenAI SDK

    Args:
        text (str): The text to embed.

    Returns:
        list: The embedding vector for the given text.

    Raises:
        RateLimitError: If the rate limit is still hit on the final attempt.
        APIError: For any non-502 API error, or a 502 on the final attempt.
    """
    num_retries = 10
    for attempt in range(num_retries):
        # Exponential backoff: 4, 8, 16, ... seconds per failed attempt.
        backoff = 2 ** (attempt + 2)
        try:
            # Azure OpenAI addresses the model via a deployment id ("engine")
            # instead of the plain model name.
            if CFG.use_azure:
                kwargs = {
                    "engine": CFG.get_azure_deployment_id_for_model(
                        "text-embedding-ada-002"
                    )
                }
            else:
                kwargs = {"model": "text-embedding-ada-002"}
            return openai.Embedding.create(input=[text], **kwargs)["data"][0][
                "embedding"
            ]
        except RateLimitError:
            # Fix: previously the final rate-limited attempt was swallowed and
            # the function implicitly returned None despite the `-> list`
            # annotation. Re-raise on the last attempt so callers see the
            # real failure, matching the APIError handling below.
            if attempt == num_retries - 1:
                raise
            if CFG.debug_mode:
                print(
                    f"{Fore.RED}Error: ",
                    f"Reached rate limit, waiting {backoff} seconds...{Fore.RESET}",
                )
        except APIError as e:
            # Only 502 Bad Gateway is considered transient and retried.
            if e.http_status != 502:
                raise
            if attempt == num_retries - 1:
                raise
            if CFG.debug_mode:
                print(
                    f"{Fore.RED}Error: ",
                    f"API Bad gateway. Waiting {backoff} seconds...{Fore.RESET}",
                )
        # Shared backoff for both retryable failure paths above.
        time.sleep(backoff)