From 227ece590fb58df0df33bc971aa62365ca547ecd Mon Sep 17 00:00:00 2001
From: "mirrobot-agent[bot]" <2140342+mirrobot-agent@users.noreply.github.com>
Date: Mon, 16 Mar 2026 15:48:42 +0000
Subject: [PATCH 1/2] fix: Robust multipart content handling in Gemini CLI
 provider

- Add _parse_content_parts() helper method to properly parse both string and list content formats
- Apply content parsing to system messages to fix Invalid JSON payload error (issue #149)
- Apply content parsing to user and assistant messages for consistency
- Resolve 'can only concatenate str (not "list") to str' error (issue #148)
- Ensure compatibility with OpenAI API multipart message format

The fix handles content in both formats:
- Plain string: "Hello"
- Multipart list: [{"type": "text", "text": "Hello"}, {"type": "image_url", ...}]

This matches the implementation in antigravity_provider.py for consistency across providers.
---
 .../providers/gemini_cli_provider.py          | 103 +++++++++++-------
 1 file changed, 62 insertions(+), 41 deletions(-)

diff --git a/src/rotator_library/providers/gemini_cli_provider.py b/src/rotator_library/providers/gemini_cli_provider.py
index 327504d7..bc2394d3 100644
--- a/src/rotator_library/providers/gemini_cli_provider.py
+++ b/src/rotator_library/providers/gemini_cli_provider.py
@@ -624,6 +624,58 @@ def _cli_preview_fallback_order(self, model: str) -> List[str]:
         # Return fallback chain if available, otherwise just return the original model
         return fallback_chains.get(model_name, [model_name])
 
+    def _parse_content_parts(
+        self, content: Any, model: str = ""
+    ) -> List[Dict[str, Any]]:
+        """
+        Parse content into Gemini parts format.
+
+        Handles both string content and multipart list content (text, images, etc.).
+        This ensures compatibility with OpenAI API format where content can be:
+        - A plain string: "Hello"
+        - A list of parts: [{"type": "text", "text": "Hello"}, {"type": "image_url", ...}]
+
+        Args:
+            content: The message content (string or list)
+            model: The model name (for context if needed)
+
+        Returns:
+            List of Gemini parts dictionaries
+        """
+        parts = []
+
+        if isinstance(content, str):
+            if content:
+                parts.append({"text": content})
+        elif isinstance(content, list):
+            for item in content:
+                if item.get("type") == "text":
+                    text = item.get("text", "")
+                    if text:
+                        parts.append({"text": text})
+                elif item.get("type") == "image_url":
+                    image_url = item.get("image_url", {}).get("url", "")
+                    if image_url.startswith("data:"):
+                        try:
+                            header, data = image_url.split(",", 1)
+                            mime_type = header.split(":")[1].split(";")[0]
+                            parts.append(
+                                {
+                                    "inlineData": {
+                                        "mimeType": mime_type,
+                                        "data": data,
+                                    }
+                                }
+                            )
+                        except Exception as e:
+                            lib_logger.warning(f"Failed to parse image data URL: {e}")
+                    else:
+                        lib_logger.warning(
+                            f"Non-data-URL images not supported: {image_url[:50]}..."
+                        )
+
+        return parts
+
     def _transform_messages(
         self, messages: List[Dict[str, Any]], model: str = ""
     ) -> Tuple[Optional[Dict[str, Any]], List[Dict[str, Any]]]:
@@ -645,10 +697,12 @@ def _transform_messages(
         if messages and messages[0].get("role") == "system":
             system_prompt_content = messages.pop(0).get("content", "")
             if system_prompt_content:
-                system_instruction = {
-                    "role": "user",
-                    "parts": [{"text": system_prompt_content}],
-                }
+                system_parts = self._parse_content_parts(system_prompt_content, model)
+                if system_parts:
+                    system_instruction = {
+                        "role": "user",
+                        "parts": system_parts,
+                    }
 
         tool_call_id_to_name = {}
         for msg in messages:
@@ -678,45 +732,12 @@ def _transform_messages(
                 pending_tool_parts = []
 
             if role == "user":
-                if isinstance(content, str):
-                    # Simple text content
-                    if content:
-                        parts.append({"text": content})
-                elif isinstance(content, list):
-                    # Multi-part content (text, images, etc.)
-                    for item in content:
-                        if item.get("type") == "text":
-                            text = item.get("text", "")
-                            if text:
-                                parts.append({"text": text})
-                        elif item.get("type") == "image_url":
-                            # Handle image data URLs
-                            image_url = item.get("image_url", {}).get("url", "")
-                            if image_url.startswith("data:"):
-                                try:
-                                    # Parse: data:image/png;base64,iVBORw0KG...
-                                    header, data = image_url.split(",", 1)
-                                    mime_type = header.split(":")[1].split(";")[0]
-                                    parts.append(
-                                        {
-                                            "inlineData": {
-                                                "mimeType": mime_type,
-                                                "data": data,
-                                            }
-                                        }
-                                    )
-                                except Exception as e:
-                                    lib_logger.warning(
-                                        f"Failed to parse image data URL: {e}"
-                                    )
-                            else:
-                                lib_logger.warning(
-                                    f"Non-data-URL images not supported: {image_url[:50]}..."
-                                )
+                parts = self._parse_content_parts(content, model)
 
             elif role == "assistant":
-                if isinstance(content, str):
-                    parts.append({"text": content})
+                if content:
+                    content_parts = self._parse_content_parts(content, model)
+                    parts.extend(content_parts)
                 if msg.get("tool_calls"):
                     # Track if we've seen the first function call in this message
                     # Per Gemini docs: Only the FIRST parallel function call gets a signature

From cf332c06dce8cf120ab98e1b3ad85499476e7d2e Mon Sep 17 00:00:00 2001
From: "mirrobot-agent[bot]" <2140342+mirrobot-agent@users.noreply.github.com>
Date: Mon, 16 Mar 2026 21:32:34 +0000
Subject: [PATCH 2/2] fix: Add defensive check for non-dict items in content
 parsing

- Skip non-dict items in multipart content lists to prevent AttributeError
- Add warning log when skipping invalid items
- Addresses review comment about unhandled edge cases

This is a defensive improvement unrelated to the RooCode issue.
---
 src/rotator_library/providers/gemini_cli_provider.py | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/src/rotator_library/providers/gemini_cli_provider.py b/src/rotator_library/providers/gemini_cli_provider.py
index bc2394d3..700e05e3 100644
--- a/src/rotator_library/providers/gemini_cli_provider.py
+++ b/src/rotator_library/providers/gemini_cli_provider.py
@@ -649,6 +649,11 @@ def _parse_content_parts(
                 parts.append({"text": content})
         elif isinstance(content, list):
             for item in content:
+                if not isinstance(item, dict):
+                    lib_logger.warning(
+                        f"Skipping non-dict item in content list: {type(item).__name__}"
+                    )
+                    continue
                 if item.get("type") == "text":
                     text = item.get("text", "")
                     if text: