Add Handling of Cache Prompt When Formatting Messages (#3773)

* Add Handling of Cache Prompt When Formatting Messages

* Fix Value for Cache Control

* Fix Value for Cache Control

* Update openhands/core/message.py

Co-authored-by: Engel Nyst <enyst@users.noreply.github.com>

* Fix lint error

* Serialize Messages if Prompt Caching Is Enabled

* Remove formatting message change

---------

Co-authored-by: Engel Nyst <enyst@users.noreply.github.com>
Co-authored-by: tobitege <10787084+tobitege@users.noreply.github.com>
This commit is contained in:
Cole Murray
2024-09-10 09:34:41 -07:00
committed by GitHub
parent 06ed142191
commit 97a03faf33
3 changed files with 11 additions and 4 deletions

View File

@@ -72,12 +72,14 @@ class Message(BaseModel):
def format_messages(
messages: Union[Message, list[Message]], with_images: bool
messages: Union[Message, list[Message]],
with_images: bool,
with_prompt_caching: bool,
) -> list[dict]:
if not isinstance(messages, list):
messages = [messages]
if with_images:
if with_images or with_prompt_caching:
return [message.model_dump() for message in messages]
converted_messages = []
@@ -113,4 +115,5 @@ def format_messages(
'content': content_str,
}
)
return converted_messages

View File

@@ -597,4 +597,6 @@ class LLM:
def format_messages_for_llm(
self, messages: Union[Message, list[Message]]
) -> list[dict]:
return format_messages(messages, self.vision_is_active())
return format_messages(
messages, self.vision_is_active(), self.is_caching_prompt_active()
)

View File

@@ -185,7 +185,9 @@ def mock_user_response(*args, test_name, **kwargs):
def mock_completion(*args, test_name, **kwargs):
global cur_id
messages = kwargs['messages']
plain_messages = format_messages(messages, with_images=False)
plain_messages = format_messages(
messages, with_images=False, with_prompt_caching=False
)
message_str = message_separator.join(msg['content'] for msg in plain_messages)
# this assumes all response_(*).log filenames are in numerical order, starting from one