basetenlabs · cretz · May 6, 2026 · May 5, 2026 · marius-baseten · May 5, 2026
diff --git a/baseten/client/_inference.py b/baseten/client/_inference.py
@@ -1,11 +1,13 @@
 from __future__ import annotations
 
+from collections.abc import Mapping
 from dataclasses import dataclass
 from typing import Any
 
 import httpx
 
 import baseten.client.inferenceapi
+from baseten.client._user_agent import with_user_agent
 
 
 @dataclass(frozen=True)
@@ -19,6 +21,9 @@ class InferenceClientOptions:
     api_key: str
     """API key for authentication."""
 
+    headers: Mapping[str, str] | None = None
+    """Additional headers to send on every request."""
+
     model_id: str | None = None
     """Model ID. Mutually exclusive with *chain_id*."""
 
@@ -84,48 +89,56 @@ def __init__(
         self,
         *,
         api_key: str,
+        headers: Mapping[str, str] | None = None,
         model_id: str | None = None,
         chain_id: str | None = None,
         environment: str | None = None,
         base_url_override: str | None = None,
-        http_client: httpx.Client | None = None,
+        http_client_override: httpx.Client | None = None,
         close_http_client_on_close: bool | None = None,
     ) -> None:
         """Create a new synchronous inference client.
 
         Args:
             api_key: API key for authentication.
+            headers: Additional headers to send on every request.
             model_id: Model ID. Mutually exclusive with *chain_id*.
             chain_id: Chain ID. Mutually exclusive with *model_id*.
             environment: Environment name for regional routing (e.g. ``"production"``).
             base_url_override: Override the computed base URL. When set,
                 *model_id*, *chain_id*, and *environment* are ignored.
-            http_client: Pre-configured httpx client. When provided, the
-                caller is responsible for setting base URL and auth headers.
+            http_client_override: Pre-configured httpx client. When provided,
+                the caller is responsible for setting base URL and all
+                headers.
             close_http_client_on_close: Whether :meth:`close` should close
                 the underlying HTTP client. Defaults to ``True`` when the
-                client is created internally, ``False`` when *http_client*
-                is provided.
+                client is created internally, ``False`` when
+                *http_client_override* is provided.
         """
         self._options = InferenceClientOptions(
             api_key=api_key,
+            headers=headers,
             model_id=model_id,
             chain_id=chain_id,
             environment=environment,
             base_url_override=base_url_override,
         )
-        if http_client is None:
+        if http_client_override is None:
+            request_headers: dict[str, str] = {**(headers or {})}
+            # Empty api_key is an advanced opt-out from sending Authorization.
+            if api_key != "":
+                request_headers["Authorization"] = f"Api-Key {api_key}"
             self._http_client = httpx.Client(
                 base_url=self._options.base_url,
-                headers={"Authorization": f"Api-Key {api_key}"},
+                headers=with_user_agent(request_headers),
             )
             self.close_http_client_on_close = (
                 True
                 if close_http_client_on_close is None
                 else close_http_client_on_close
             )
         else:
-            self._http_client = http_client
+            self._http_client = http_client_override
             self.close_http_client_on_close = (
                 False
                 if close_http_client_on_close is None
@@ -191,49 +204,56 @@ def __init__(
         self,
         *,
         api_key: str,
+        headers: Mapping[str, str] | None = None,
         model_id: str | None = None,
         chain_id: str | None = None,
         environment: str | None = None,
         base_url_override: str | None = None,
-        http_client: httpx.AsyncClient | None = None,
+        http_client_override: httpx.AsyncClient | None = None,
         close_http_client_on_close: bool | None = None,
     ) -> None:
         """Create a new asynchronous inference client.
 
         Args:
             api_key: API key for authentication.
+            headers: Additional headers to send on every request.
             model_id: Model ID. Mutually exclusive with *chain_id*.
             chain_id: Chain ID. Mutually exclusive with *model_id*.
             environment: Environment name for regional routing (e.g. ``"production"``).
             base_url_override: Override the computed base URL. When set,
                 *model_id*, *chain_id*, and *environment* are ignored.
-            http_client: Pre-configured httpx async client. When provided,
-                the caller is responsible for setting base URL and auth
-                headers.
+            http_client_override: Pre-configured httpx async client. When
+                provided, the caller is responsible for setting base URL
+                and all headers.
             close_http_client_on_close: Whether :meth:`close` should close
                 the underlying HTTP client. Defaults to ``True`` when the
-                client is created internally, ``False`` when *http_client*
-                is provided.
+                client is created internally, ``False`` when
+                *http_client_override* is provided.
         """
         self._options = InferenceClientOptions(
             api_key=api_key,
+            headers=headers,
             model_id=model_id,
             chain_id=chain_id,
             environment=environment,
             base_url_override=base_url_override,
         )
-        if http_client is None:
+        if http_client_override is None:
+            request_headers: dict[str, str] = {**(headers or {})}
+            # Empty api_key is an advanced opt-out from sending Authorization.
+            if api_key != "":
+                request_headers["Authorization"] = f"Api-Key {api_key}"
             self._http_client = httpx.AsyncClient(
                 base_url=self._options.base_url,
-                headers={"Authorization": f"Api-Key {api_key}"},
+                headers=with_user_agent(request_headers),
             )
             self.close_http_client_on_close = (
                 True
                 if close_http_client_on_close is None
                 else close_http_client_on_close
             )
         else:
-            self._http_client = http_client
+            self._http_client = http_client_override
             self.close_http_client_on_close = (
                 False
                 if close_http_client_on_close is None

diff --git a/baseten/client/_management.py b/baseten/client/_management.py
@@ -1,11 +1,13 @@
 from __future__ import annotations
 
+from collections.abc import Mapping
 from dataclasses import dataclass
 from typing import Any
 
 import httpx
 
 import baseten.client.managementapi
+from baseten.client._user_agent import with_user_agent
 
 
 @dataclass(frozen=True)
@@ -19,6 +21,9 @@ class ManagementClientOptions:
     api_key: str
     """API key for authentication."""
 
+    headers: Mapping[str, str] | None = None
+    """Additional headers to send on every request."""
+
     base_url_override: str | None = None
     """Explicit base URL override, or ``None`` to use the default."""
 
@@ -46,38 +51,45 @@ def __init__(
         self,
         *,
         api_key: str,
+        headers: Mapping[str, str] | None = None,
         base_url_override: str | None = None,
-        http_client: httpx.Client | None = None,
+        http_client_override: httpx.Client | None = None,
         close_http_client_on_close: bool | None = None,
     ) -> None:
         """Create a new synchronous management client.
 
         Args:
             api_key: API key for authentication.
+            headers: Additional headers to send on every request.
             base_url_override: Override the default base URL. When ``None``,
                 :meth:`default_base_url` is used.
-            http_client: Pre-configured httpx client. When provided, the
-                caller is responsible for setting base URL and auth headers.
+            http_client_override: Pre-configured httpx client. When provided,
+                the caller is responsible for setting base URL and all
+                headers.
             close_http_client_on_close: Whether :meth:`close` should close
                 the underlying HTTP client. Defaults to ``True`` when the
-                client is created internally, ``False`` when *http_client*
-                is provided.
+                client is created internally, ``False`` when
+                *http_client_override* is provided.
         """
         self._options = ManagementClientOptions(
-            api_key=api_key, base_url_override=base_url_override
+            api_key=api_key, headers=headers, base_url_override=base_url_override
         )
-        if http_client is None:
+        if http_client_override is None:
+            request_headers: dict[str, str] = {**(headers or {})}
+            # Empty api_key is an advanced opt-out from sending Authorization.
+            if api_key != "":
+                request_headers["Authorization"] = f"Api-Key {api_key}"
             self._http_client = httpx.Client(
                 base_url=self._options.base_url,
-                headers={"Authorization": f"Api-Key {api_key}"},
+                headers=with_user_agent(request_headers),
             )
             self.close_http_client_on_close = (
                 True
                 if close_http_client_on_close is None
                 else close_http_client_on_close
             )
         else:
-            self._http_client = http_client
+            self._http_client = http_client_override
             self.close_http_client_on_close = (
                 False
                 if close_http_client_on_close is None
@@ -132,39 +144,45 @@ def __init__(
         self,
         *,
         api_key: str,
+        headers: Mapping[str, str] | None = None,
         base_url_override: str | None = None,
-        http_client: httpx.AsyncClient | None = None,
+        http_client_override: httpx.AsyncClient | None = None,
         close_http_client_on_close: bool | None = None,
     ) -> None:
         """Create a new asynchronous management client.
 
         Args:
             api_key: API key for authentication.
+            headers: Additional headers to send on every request.
             base_url_override: Override the default base URL. When ``None``,
                 :meth:`default_base_url` is used.
-            http_client: Pre-configured httpx async client. When provided,
-                the caller is responsible for setting base URL and auth
-                headers.
+            http_client_override: Pre-configured httpx async client. When
+                provided, the caller is responsible for setting base URL
+                and all headers.
             close_http_client_on_close: Whether :meth:`close` should close
                 the underlying HTTP client. Defaults to ``True`` when the
-                client is created internally, ``False`` when *http_client*
-                is provided.
+                client is created internally, ``False`` when
+                *http_client_override* is provided.
         """
         self._options = ManagementClientOptions(
-            api_key=api_key, base_url_override=base_url_override
+            api_key=api_key, headers=headers, base_url_override=base_url_override
         )
-        if http_client is None:
+        if http_client_override is None:
+            request_headers: dict[str, str] = {**(headers or {})}
+            # Empty api_key is an advanced opt-out from sending Authorization.
+            if api_key != "":
+                request_headers["Authorization"] = f"Api-Key {api_key}"
             self._http_client = httpx.AsyncClient(
                 base_url=self._options.base_url,
-                headers={"Authorization": f"Api-Key {api_key}"},
+                headers=with_user_agent(request_headers),
             )
             self.close_http_client_on_close = (
                 True
                 if close_http_client_on_close is None
                 else close_http_client_on_close
             )
         else:
-            self._http_client = http_client
+            self._http_client = http_client_override
             self.close_http_client_on_close = (
                 False
                 if close_http_client_on_close is None

diff --git a/baseten/client/_user_agent.py b/baseten/client/_user_agent.py
@@ -0,0 +1,25 @@
+import platform
+from collections.abc import Mapping
+from importlib.metadata import PackageNotFoundError, version
+
+
+def _package_version() -> str:  # installed "baseten" version, or "dev" as a fallback
+    try:
+        return version("baseten")  # looked up via importlib.metadata
+    except PackageNotFoundError:  # no "baseten" distribution metadata was found
+        return "dev"  # placeholder so building the User-Agent never raises here
+
+
+def user_agent_header() -> str:
+    """Return the SDK User-Agent string, e.g. ``baseten-python/0.9.0 (Python/3.13.2; Linux)``."""
+    sdk_version = _package_version()
+    python_version = platform.python_version()
+    os_name = platform.system()
+    return f"baseten-python/{sdk_version} (Python/{python_version}; {os_name})"
+
+
+def with_user_agent(headers: Mapping[str, str]) -> dict[str, str]:
+    """Copy ``headers``, adding our User-Agent unless one is present (case-insensitive)."""
+    caller_set_agent = "user-agent" in (name.lower() for name in headers)
+    default_agent = {} if caller_set_agent else {"User-Agent": user_agent_header()}
+    return {**headers, **default_agent}