fix: Orient dataframe JSON row-wise & support more data-frame types (#183)

cpsievert · web-flow · commit 44cb1c395d18 · 2025-09-26T18:18:33.000-05:00
* Close #180: Improved ContentToolResult() handling for data frames * Update test; tweak changelog
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -9,6 +9,10 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 
 ## [UNRELEASED]
 
+### Improvements
+
+* `ContentToolResult`'s `.get_model_value()` method now calls `.to_json(orient="records")` (instead of `.to_json()`) when the value's `.to_json()` method accepts an `orient` argument. As a result, if a tool call returns a pandas `DataFrame` (or a similar object that can be converted via `.to_pandas()`), the model now receives a less confusing (and smaller) row-wise JSON format. (#183)
+
 ### Bug fixes
 
 * `ChatAzureOpenAI()` and `ChatDatabricks()` now work as expected when a `OPENAI_API_KEY` environment variable isn't present. (#185)
diff --git a/chatlas/_content.py b/chatlas/_content.py
@@ -1,7 +1,9 @@
 from __future__ import annotations
 
+import inspect
+import warnings
 from pprint import pformat
-from typing import TYPE_CHECKING, Any, Literal, Optional, Union
+from typing import TYPE_CHECKING, Any, Literal, Optional, Union, cast
 
 import orjson
 from pydantic import BaseModel, ConfigDict
@@ -465,8 +467,36 @@ def get_model_value(self) -> object:
 
     @staticmethod
     def _to_json(value: Any) -> object:
+        if hasattr(value, "to_pandas") and callable(value.to_pandas):
+            # Many (most?) df libs (polars, pyarrow, ...) have a .to_pandas()
+            # method, and pandas has a .to_json() method
+            value = value.to_pandas()
+
         if hasattr(value, "to_json") and callable(value.to_json):
-            return value.to_json()
+            # pandas defaults to "columns", which is not ideal for LLMs
+            # https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.to_json.html
+            sig = inspect.signature(value.to_json)
+            if "orient" in list(sig.parameters.keys()):
+                return value.to_json(orient="records")
+            else:
+                return value.to_json()
+
+        # Support for df libs (beyond those with a .to_pandas() method)
+        if hasattr(value, "__narwhals_dataframe__"):
+            try:
+                import narwhals
+
+                val = cast(narwhals.DataFrame, narwhals.from_native(value))
+                return val.to_pandas().to_json(orient="records")
+            except ImportError:
+                warnings.warn(
+                    f"Tool result object of type {type(value)} appears to be a "
+                    "narwhals-compatible DataFrame. If you run into issues with "
+                    "the LLM not understanding this value, try installing narwhals: "
+                    "`pip install narwhals`.",
+                    ImportWarning,
+                    stacklevel=2,
+                )
 
         if hasattr(value, "to_dict") and callable(value.to_dict):
             value = value.to_dict()
diff --git a/pyproject.toml b/pyproject.toml
@@ -48,7 +48,11 @@ dev = [
     "matplotlib",
     "Pillow",
     "shiny",
+    "htmltools",
     "shinychat",
+    "narwhals",
+    "pandas",
+    "polars",
     "openai",
     "anthropic[bedrock]",
     "google-genai>=1.14.0",
@@ -58,7 +62,6 @@ dev = [
     "snowflake-ml-python>=1.8.4",
     # torch (a dependency of snowflake-ml-python) is not yet compatible with Python >3.11
     "torch;python_version<='3.11'",
-    "htmltools",
     "tenacity"
 ]
 docs = [
diff --git a/tests/test_content_tools.py b/tests/test_content_tools.py
@@ -1,5 +1,7 @@
 from typing import Any, Optional, Union
+from unittest.mock import Mock
 
+import orjson
 import pytest
 
 from chatlas import ChatOpenAI
@@ -403,3 +405,93 @@ def add(x: int, y: int) -> int:
     assert parsed.tool is not None
     assert parsed.tool.name == "add"
     assert parsed.tool.description == "Add two numbers"
+
+
+def test_content_tool_result_pandas_dataframe():
+    """Test ContentToolResult with pandas DataFrame using orient='records'"""
+    pandas = pytest.importorskip("pandas")
+
+    # Create a simple pandas DataFrame
+    df = pandas.DataFrame(
+        {"name": ["Alice", "Bob"], "age": [25, 30], "city": ["New York", "London"]}
+    )
+
+    # Create ContentToolResult with DataFrame value
+    result = ContentToolResult(value=df).get_model_value()
+    expected = df.to_json(orient="records")
+    assert result == expected
+
+    parsed = orjson.loads(str(result))
+    assert isinstance(parsed, list)
+    assert len(parsed) == 2
+    assert parsed[0] == {"name": "Alice", "age": 25, "city": "New York"}
+    assert parsed[1] == {"name": "Bob", "age": 30, "city": "London"}
+
+
+def test_content_tool_result_object_with_to_pandas():
+    """Test ContentToolResult with objects that have .to_pandas() method"""
+    pandas = pytest.importorskip("pandas")
+
+    # Create mock object with to_pandas method (like Polars, PyArrow)
+    mock_df_lib = Mock()
+    pandas_df = pandas.DataFrame({"x": [1, 2, 3], "y": ["a", "b", "c"]})
+    mock_df_lib.to_pandas.return_value = pandas_df
+
+    result = ContentToolResult(value=mock_df_lib).get_model_value()
+    mock_df_lib.to_pandas.assert_called_once()
+    expected = pandas_df.to_json(orient="records")
+    assert result == expected
+
+
+def test_content_tool_result_narwhals_dataframe():
+    """Test ContentToolResult with narwhals DataFrame"""
+    narwhals = pytest.importorskip("narwhals")
+    pandas = pytest.importorskip("pandas")
+
+    pandas_df = pandas.DataFrame({"a": [1, 2], "b": ["x", "y"]})
+    nw_df = narwhals.from_native(pandas_df)
+    result = ContentToolResult(value=nw_df).get_model_value()
+    expected = pandas_df.to_json(orient="records")
+    assert result == expected
+
+
+def test_content_tool_result_object_with_to_dict():
+    """Test ContentToolResult with objects that have to_dict method"""
+    # Mock object with to_dict method but no to_pandas or to_json
+    mock_obj = Mock(spec=["to_dict"])
+    mock_obj.to_dict.return_value = {"key": "value"}
+    result = ContentToolResult(value=mock_obj).get_model_value()
+    mock_obj.to_dict.assert_called_once()
+    # Result should be JSON string representation (orjson format)
+    assert result == '{"key":"value"}'
+
+
+def test_content_tool_result_string_passthrough():
+    """Test ContentToolResult with string values (special case - passed through as-is)"""
+    result = ContentToolResult(value="plain string").get_model_value()
+    assert result == "plain string"
+
+
+def test_content_tool_result_fallback_serialization():
+    """Test ContentToolResult fallback for objects without special methods"""
+    # Regular object without to_json, to_pandas, or to_dict (non-string to avoid the string special case)
+    result = ContentToolResult(value={"key": "value"}).get_model_value()
+    assert result == '{"key":"value"}'
+
+
+def test_content_tool_result_explicit_json_mode():
+    """Test ContentToolResult with explicit JSON mode forces _to_json for non-strings"""
+    # Test with non-string object and explicit JSON mode
+    result = ContentToolResult(
+        value={"key": "value"},
+        model_format="json",
+    ).get_model_value()
+    # With explicit JSON mode, objects get JSON-encoded
+    assert result == '{"key":"value"}'
+    # Test that strings still get special treatment even in JSON mode
+    string_result = ContentToolResult(
+        value="plain string",
+        model_format="json",
+    ).get_model_value()
+    # Strings are still returned as-is even in JSON mode (current behavior)
+    assert string_result == "plain string"
diff --git a/tests/test_tokens.py b/tests/test_tokens.py
@@ -70,7 +70,7 @@ def test_token_count_method():
     chat = ChatAnthropic(model="claude-3-5-sonnet-20241022")
     assert chat.token_count("What is 1 + 1?") == 16
 
-    chat = ChatGoogle(model="gemini-1.5-flash")
+    chat = ChatGoogle(model="gemini-2.5-flash")
     assert chat.token_count("What is 1 + 1?") == 9