OpenHands · ak684 · Oct 30, 2025 · Oct 30, 2025 · Oct 30, 2025 · Oct 31, 2025
diff --git a/openhands-sdk/openhands/sdk/llm/__init__.py b/openhands-sdk/openhands/sdk/llm/__init__.py
@@ -1,6 +1,7 @@
 from openhands.sdk.llm.llm import LLM
 from openhands.sdk.llm.llm_registry import LLMRegistry, RegistryEvent
 from openhands.sdk.llm.llm_response import LLMResponse
+from openhands.sdk.llm.llm_with_gateway import LLMWithGateway
 from openhands.sdk.llm.message import (
     ImageContent,
     Message,
@@ -23,6 +24,7 @@
 __all__ = [
     "LLMResponse",
     "LLM",
+    "LLMWithGateway",
     "LLMRegistry",
     "RouterLLM",
     "RegistryEvent",

diff --git a/openhands-sdk/openhands/sdk/llm/llm.py b/openhands-sdk/openhands/sdk/llm/llm.py
@@ -162,6 +162,16 @@ class LLM(BaseModel, RetryMixin, NonNativeToolCallingMixin):
     )
     ollama_base_url: str | None = Field(default=None)
 
+    # When left as None, _litellm_ssl_verify_ctx leaves litellm.ssl_verify as-is.
+    # NOTE(review): a str value is presumably a CA-bundle path -- confirm.
+    ssl_verify: bool | str | None = Field(
+        default=None,
+        description=(
+            "TLS verification forwarded to LiteLLM; "
+            "set to False when corporate proxies break certificate chains."
+        ),
+    )
+
     drop_params: bool = Field(default=True)
     modify_params: bool = Field(
         default=True,
@@ -583,33 +591,39 @@ def responses(
         def _one_attempt(**retry_kwargs) -> ResponsesAPIResponse:
             final_kwargs = {**call_kwargs, **retry_kwargs}
-            with self._litellm_modify_params_ctx(self.modify_params):
+            # Temporarily override the litellm module-level settings
+            # (modify_params, ssl_verify); each is restored on exit.
+            with (
+                self._litellm_modify_params_ctx(self.modify_params),
+                self._litellm_ssl_verify_ctx(),
+            ):
                 with warnings.catch_warnings():
                     warnings.filterwarnings("ignore", category=DeprecationWarning)
                     typed_input: ResponseInputParam | str = (
                         cast(ResponseInputParam, input_items) if input_items else ""
                     )
                     ret = litellm_responses(
                         model=self.model,
                         input=typed_input,
                         instructions=instructions,
                         tools=resp_tools,
                         api_key=self.api_key.get_secret_value()
                         if self.api_key
                         else None,
                         api_base=self.base_url,
                         api_version=self.api_version,
+                        custom_llm_provider=self.custom_llm_provider,
                         timeout=self.timeout,
                         drop_params=self.drop_params,
                         seed=self.seed,
                         **final_kwargs,
                     )
                     assert isinstance(ret, ResponsesAPIResponse), (
                         f"Expected ResponsesAPIResponse, got {type(ret)}"
                     )
                     # telemetry (latency, cost). Token usage mapping we handle after.
                     assert self._telemetry is not None
                     self._telemetry.on_response(ret)
                     return ret
 
         try:
             resp: ResponsesAPIResponse = _one_attempt()
@@ -642,40 +652,46 @@ def _transport_call(
     ) -> ModelResponse:
         # litellm.modify_params is GLOBAL; guard it for thread-safety
-        with self._litellm_modify_params_ctx(self.modify_params):
+        # litellm.ssl_verify is module-level too; override it alongside.
+        with (
+            self._litellm_modify_params_ctx(self.modify_params),
+            self._litellm_ssl_verify_ctx(),
+        ):
             with warnings.catch_warnings():
                 warnings.filterwarnings(
                     "ignore", category=DeprecationWarning, module="httpx.*"
                 )
                 warnings.filterwarnings(
                     "ignore",
                     message=r".*content=.*upload.*",
                     category=DeprecationWarning,
                 )
                 warnings.filterwarnings(
                     "ignore",
                     message=r"There is no current event loop",
                     category=DeprecationWarning,
                 )
                 warnings.filterwarnings(
                     "ignore",
                     category=UserWarning,
                 )
                 # Some providers need renames handled in _normalize_call_kwargs.
                 ret = litellm_completion(
                     model=self.model,
                     api_key=self.api_key.get_secret_value() if self.api_key else None,
                     base_url=self.base_url,
                     api_version=self.api_version,
+                    custom_llm_provider=self.custom_llm_provider,
                     timeout=self.timeout,
+                    ssl_verify=self.ssl_verify,
                     drop_params=self.drop_params,
                     seed=self.seed,
                     messages=messages,
                     **kwargs,
                 )
                 assert isinstance(ret, ModelResponse), (
                     f"Expected ModelResponse, got {type(ret)}"
                 )
                 return ret
 
     @contextmanager
     def _litellm_modify_params_ctx(self, flag: bool):
@@ -686,6 +701,26 @@ def _litellm_modify_params_ctx(self, flag: bool):
         finally:
             litellm.modify_params = old
 
+    @contextmanager
+    def _litellm_ssl_verify_ctx(self):
+        """Temporarily apply ``self.ssl_verify`` to ``litellm.ssl_verify``.
+
+        Does nothing when ``self.ssl_verify`` is None. Otherwise the
+        module-level ``litellm.ssl_verify`` is set for the duration of the
+        ``with`` body and its previous value is restored on exit, even if
+        the body raises.
+        """
+        override = self.ssl_verify
+        if override is None:
+            yield
+        else:
+            previous = getattr(litellm, "ssl_verify", None)
+            try:
+                litellm.ssl_verify = override
+                yield
+            finally:
+                litellm.ssl_verify = previous
+
     # =========================================================================
     # Capabilities, formatting, and info
     # =========================================================================