Include the token length of the current summary (#4670)

Co-authored-by: merwanehamadi <merwanehamadi@gmail.com>
pull/4589/head^2
Kinance 2023-06-13 08:29:11 +09:00 committed by GitHub
parent f277e6aa2d
commit 7bf39cbb72
1 changed file with 8 additions and 1 deletion


@@ -174,6 +174,7 @@ class MessageHistory:
         # TODO make this default dynamic
         prompt_template_length = 100
         max_tokens = OPEN_AI_CHAT_MODELS.get(cfg.fast_llm_model).max_tokens
+        summary_tlength = count_string_tokens(str(self.summary), cfg.fast_llm_model)
         batch = []
         batch_tlength = 0
@@ -181,9 +182,15 @@
         for event in new_events:
             event_tlength = count_string_tokens(str(event), cfg.fast_llm_model)
-            if batch_tlength + event_tlength > max_tokens - prompt_template_length:
+            if (
+                batch_tlength + event_tlength
+                > max_tokens - prompt_template_length - summary_tlength
+            ):
                 # The batch is full. Summarize it and start a new one.
                 self.summarize_batch(batch, cfg)
+                summary_tlength = count_string_tokens(
+                    str(self.summary), cfg.fast_llm_model
+                )
                 batch = [event]
                 batch_tlength = event_tlength
             else:
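
For reference, here is a minimal, self-contained sketch of the batching logic after this change. The token counter and summarizer below are simplified stand-ins for Auto-GPT's count_string_tokens and summarize_batch helpers, so the numbers are only illustrative; the point is that the running summary's token count is subtracted from each batch's budget and refreshed after every summarization.

def count_tokens(text: str) -> int:
    # Crude stand-in for count_string_tokens: roughly one token per word.
    return len(text.split())

class MessageHistorySketch:
    def __init__(self, max_tokens: int = 4096, prompt_template_length: int = 100):
        self.summary = ""
        self.max_tokens = max_tokens
        self.prompt_template_length = prompt_template_length

    def summarize_batch(self, batch: list[str]) -> None:
        # Stand-in for the LLM call: fold truncated events into the summary.
        self.summary += " " + " | ".join(event[:40] for event in batch)

    def trim(self, new_events: list[str]) -> None:
        summary_tlength = count_tokens(self.summary)
        batch: list[str] = []
        batch_tlength = 0
        for event in new_events:
            event_tlength = count_tokens(event)
            # Reserve space for both the prompt template and the current summary.
            if (
                batch_tlength + event_tlength
                > self.max_tokens - self.prompt_template_length - summary_tlength
            ):
                # The batch is full. Summarize it and start a new one.
                self.summarize_batch(batch)
                # The summary just grew, so recount its tokens for the next budget check.
                summary_tlength = count_tokens(self.summary)
                batch = [event]
                batch_tlength = event_tlength
            else:
                batch.append(event)
                batch_tlength += event_tlength
        # Assumed here: any leftover events are summarized after the loop
        # (the tail of the real method is not shown in this diff).
        if batch:
            self.summarize_batch(batch)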