Pickle-Pixel · YuHuang0525 · Mar 14, 2026
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -5,6 +5,13 @@ All notable changes to ApplyPilot will be documented in this file.
 The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.1.0/),
 and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
 
+## [Unreleased]
+
+### Fixed
+- **Newer OpenAI models (gpt-4.1+, gpt-5.x, o-series) rejected with HTTP 400** — these models
+  require `max_completion_tokens` instead of the legacy `max_tokens` parameter. `_chat_compat()`
+  now checks the model-name prefix and sends the matching parameter automatically.
+
 ## [0.2.0] - 2026-02-17
 
 ### Added

diff --git a/src/applypilot/llm.py b/src/applypilot/llm.py
@@ -157,11 +157,20 @@ def _chat_compat(
         if self.api_key:
             headers["Authorization"] = f"Bearer {self.api_key}"
 
+        # Newer OpenAI models (gpt-4.1+, gpt-5.x, o-series) require
+        # max_completion_tokens instead of the legacy max_tokens parameter.
+        # Sending max_tokens to these models returns HTTP 400.
+        _new_param_models = ("gpt-4.1", "gpt-5", "o1", "o3", "o4")
+        if any(self.model.startswith(p) for p in _new_param_models):
+            token_param: dict[str, int] = {"max_completion_tokens": max_tokens}
+        else:
+            token_param = {"max_tokens": max_tokens}
+
         payload = {
             "model": self.model,
             "messages": messages,
             "temperature": temperature,
-            "max_tokens": max_tokens,
+            **token_param,
         }
 
         resp = self._client.post(