Skip to content

Commit 19eb50b

Browse files
committed
Implement CoT no-op for reasoning models
1 parent 734eff2 commit 19eb50b

File tree

5 files changed

+170
-151
lines changed

5 files changed

+170
-151
lines changed

dspy/clients/lm.py

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -37,6 +37,7 @@ def __init__(
3737
callbacks: Optional[List[BaseCallback]] = None,
3838
num_retries: int = 3,
3939
provider: Optional[Provider] = None,
40+
reasoning_model: Optional[bool] = None,
4041
finetuning_model: Optional[str] = None,
4142
launch_kwargs: Optional[dict[str, Any]] = None,
4243
train_kwargs: Optional[dict[str, Any]] = None,
@@ -51,6 +52,7 @@ def __init__(
5152
model_type: The type of the model, either ``"chat"`` or ``"text"``.
5253
temperature: The sampling temperature to use when generating responses.
5354
max_tokens: The maximum number of tokens to generate per response.
55+
reasoning_model: Whether the model is a reasoning model.
5456
cache: Whether to cache the model responses for reuse to improve performance
5557
and reduce costs.
5658
cache_in_memory (deprecated): To enable additional caching with LRU in memory.
@@ -71,6 +73,7 @@ def __init__(
7173
self.callbacks = callbacks or []
7274
self.history = []
7375
self.num_retries = num_retries
76+
self.reasoning_model = reasoning_model if reasoning_model is not None else litellm.supports_reasoning(model)
7477
self.finetuning_model = finetuning_model
7578
self.launch_kwargs = launch_kwargs or {}
7679
self.train_kwargs = train_kwargs or {}

dspy/predict/chain_of_thought.py

Lines changed: 9 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -27,12 +27,15 @@ def __init__(
2727
"""
2828
super().__init__()
2929
signature = ensure_signature(signature)
30-
prefix = "Reasoning: Let's think step by step in order to"
31-
desc = "${reasoning}"
32-
rationale_field_type = rationale_field.annotation if rationale_field else rationale_field_type
33-
rationale_field = rationale_field if rationale_field else dspy.OutputField(prefix=prefix, desc=desc)
34-
extended_signature = signature.prepend(name="reasoning", field=rationale_field, type_=rationale_field_type)
35-
self.predict = dspy.Predict(extended_signature, **config)
30+
if dspy.settings.lm.reasoning_model:
31+
self.predict = dspy.Predict(signature, **config)
32+
else:
33+
prefix = "Reasoning: Let's think step by step in order to"
34+
desc = "${reasoning}"
35+
rationale_field_type = rationale_field.annotation if rationale_field else rationale_field_type
36+
rationale_field = rationale_field if rationale_field else dspy.OutputField(prefix=prefix, desc=desc)
37+
extended_signature = signature.prepend(name="reasoning", field=rationale_field, type_=rationale_field_type)
38+
self.predict = dspy.Predict(extended_signature, **config)
3639

3740
def forward(self, **kwargs):
3841
return self.predict(**kwargs)

pyproject.toml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -32,7 +32,7 @@ dependencies = [
3232
"optuna>=3.4.0",
3333
"pydantic>=2.0",
3434
"magicattr>=0.1.6",
35-
"litellm>=1.64.0",
35+
"litellm>=1.72.4",
3636
"diskcache>=5.6.0",
3737
"json-repair>=0.30.0",
3838
"tenacity>=8.2.3",
@@ -59,8 +59,8 @@ dev = [
5959
"pillow>=10.1.0",
6060
"datamodel_code_generator>=0.26.3",
6161
"build>=1.0.3",
62-
"litellm>=1.64.0; sys_platform == 'win32'",
63-
"litellm[proxy]>=1.64.0; sys_platform != 'win32'",
62+
"litellm>=1.72.4; sys_platform == 'win32'",
63+
"litellm[proxy]>=1.72.4; sys_platform != 'win32'",
6464
]
6565
test_extras = [
6666
"mcp; python_version >= '3.10'",

tests/predict/test_chain_of_thought.py

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -23,3 +23,15 @@ async def test_async_chain_of_thought():
2323
program = ChainOfThought("question -> answer")
2424
result = await program.acall(question="What is 1+1?")
2525
assert result.answer == "2"
26+
27+
28+
def test_cot_skips_with_reasoning_model():
29+
lm = DummyLM([{"answer": "2"}])
30+
lm.reasoning_model = True
31+
dspy.settings.configure(lm=lm)
32+
signature = dspy.Signature("question -> answer")
33+
predict = ChainOfThought(signature)
34+
assert list(predict.predict.signature.output_fields.keys()) == [
35+
"answer",
36+
]
37+
assert predict(question="What is 1+1?").answer == "2"

0 commit comments

Comments (0)