Fix Celery SoftTimeLimitExceeded exception handling

yashwantbezawada · yashwantbezawada · commit 1721d582af15 · 2025-11-07T10:50:21.000-06:00
When using the OpenAI client in Celery tasks with soft time limits, the client's broad exception handling was catching SoftTimeLimitExceeded and treating it as a retryable connection error. This prevented Celery tasks from properly handling timeouts and running cleanup logic. This change adds a check to identify termination signals (like Celery's SoftTimeLimitExceeded or asyncio's CancelledError) and re-raises them immediately without retry. This allows task executors to properly handle these signals. Changes: - Added _should_not_retry() helper to identify termination signals - Modified sync and async exception handlers to check before retrying - Added test to verify termination signals are not retried Fixes #2737
diff --git a/src/openai/_base_client.py b/src/openai/_base_client.py
@@ -88,6 +88,36 @@
 log: logging.Logger = logging.getLogger(__name__)
 log.addFilter(SensitiveHeadersFilter())
 
+
+def _should_not_retry(exc: Exception) -> bool:
+    """
+    Check if an exception should propagate immediately without retry.
+
+    This includes task cancellation signals from async frameworks
+    and task executors like Celery that should not be caught and retried.
+
+    Args:
+        exc: The exception to check
+
+    Returns:
+        True if the exception should propagate without retry, False otherwise
+    """
+    exc_class = exc.__class__
+    exc_module = exc_class.__module__
+    exc_name = exc_class.__name__
+
+    # Celery task termination (don't import celery - check by name)
+    # Examples: SoftTimeLimitExceeded, TimeLimitExceeded, Terminated
+    if exc_module.startswith("celery") and ("Limit" in exc_name or "Terminated" in exc_name):
+        return True
+
+    # asyncio cancellation
+    if exc_module == "asyncio" and exc_name == "CancelledError":
+        return True
+
+    return False
+
+
 # TODO: make base page type vars covariant
 SyncPageT = TypeVar("SyncPageT", bound="BaseSyncPage[Any]")
 AsyncPageT = TypeVar("AsyncPageT", bound="BaseAsyncPage[Any]")
@@ -1001,6 +1031,10 @@ def request(
             except Exception as err:
                 log.debug("Encountered Exception", exc_info=True)
 
+                # Check if this is a termination signal that should not be retried
+                if _should_not_retry(err):
+                    raise
+
                 if remaining_retries > 0:
                     self._sleep_for_retry(
                         retries_taken=retries_taken,
@@ -1548,6 +1582,10 @@ async def request(
             except Exception as err:
                 log.debug("Encountered Exception", exc_info=True)
 
+                # Check if this is a termination signal that should not be retried
+                if _should_not_retry(err):
+                    raise
+
                 if remaining_retries > 0:
                     await self._sleep_for_retry(
                         retries_taken=retries_taken,
diff --git a/tests/test_client.py b/tests/test_client.py
@@ -885,6 +885,37 @@ def retry_handler(_request: httpx.Request) -> httpx.Response:
 
         assert response.http_request.headers.get("x-stainless-retry-count") == "42"
 
+    @mock.patch("openai._base_client.BaseClient._calculate_retry_timeout", _low_retry_timeout)
+    @pytest.mark.respx(base_url=base_url)
+    def test_termination_signal_not_retried(self, respx_mock: MockRouter, client: OpenAI) -> None:
+        """Test that termination signals (like Celery's SoftTimeLimitExceeded) are not retried."""
+        client = client.with_options(max_retries=3)
+
+        # Create a mock exception that mimics Celery's SoftTimeLimitExceeded
+        class MockCelerySoftTimeLimitExceeded(Exception):
+            """Mock of celery.exceptions.SoftTimeLimitExceeded"""
+
+            __module__ = "celery.exceptions"
+            __name__ = "SoftTimeLimitExceeded"
+
+        # Mock the request to raise our termination signal
+        respx_mock.post("/chat/completions").mock(side_effect=MockCelerySoftTimeLimitExceeded("Time limit exceeded"))
+
+        # Verify the exception propagates without retry
+        with pytest.raises(MockCelerySoftTimeLimitExceeded):
+            client.chat.completions.create(
+                messages=[
+                    {
+                        "content": "string",
+                        "role": "developer",
+                    }
+                ],
+                model="gpt-4o",
+            )
+
+        # Verify only one attempt was made (no retries)
+        assert len(respx_mock.calls) == 1
+
     @pytest.mark.parametrize("failures_before_success", [0, 2, 4])
     @mock.patch("openai._base_client.BaseClient._calculate_retry_timeout", _low_retry_timeout)
     @pytest.mark.respx(base_url=base_url)