Nathan Weinshenker
--- a/tests/chat/test_agent_react.py
+++ b/tests/chat/test_agent_react.py

        for msg in prompt_value.messages:
            if isinstance(msg, SystemMessage):
-                if feature_flag_enabled:
+                if feature_flag_enabled and not mock_config.custom_models.enabled:
                    content_dict = msg.content[0]
                    assert content_dict["type"] == "text"
                    assert content_dict["cache_control"] == {"type": "ephemeral"}
-                if feature_flag_enabled and not mock_config.custom_models.enabled:
-                    content_dict = msg.content[0]
-                    assert content_dict["type"] == "text"
-                    assert content_dict["cache_control"] == {"type": "ephemeral"}
+                if feature_flag_enabled and not mock_config.custom_models.enabled:
+                    content_dict = msg.content[0]
+                    assert isinstance(content_dict, dict)
+                    assert content_dict["type"] == "text"
+                    assert content_dict["cache_control"] == {"type": "ephemeral"}
--- a/tests/chat/test_agent_react.py
+++ b/tests/chat/test_agent_react.py
        assert cap_logs[-1]["event"] == "Response streaming"

    @pytest.mark.asyncio
-    @pytest.mark.parametrize("feature_flag_enabled", [True, False])
-    async def test_stream_message_cache_control(
-        self,
-        prompt: ReActAgent,
-        feature_flag_enabled: bool,
+    @pytest.mark.parametrize(