fix: One more attempt at resolving the tokens dynamically.

mgiannakopoulos · mgiannakopoulos · commit c93ff7d54df8 · 2025-12-03T10:52:08.000-05:00
diff --git a/singlestoredb/ai/__init__.py b/singlestoredb/ai/__init__.py
@@ -1,2 +1,3 @@
 from .chat import SingleStoreChatFactory  # noqa: F401
+from .debugv1 import SingleStoreChatFactoryDebugV1  # noqa: F401
 from .embeddings import SingleStoreEmbeddingsFactory  # noqa: F401
diff --git a/singlestoredb/ai/debugv1.py b/singlestoredb/ai/debugv1.py
@@ -0,0 +1,221 @@
+import os
+from typing import Any
+from typing import Callable
+from typing import Optional
+from typing import Union
+
+import httpx
+
+from singlestoredb import manage_workspaces
+from singlestoredb.ai.utils import SingleStoreOpenAIAuth
+from singlestoredb.management.inference_api import InferenceAPIInfo
+
+try:
+    from langchain_openai import ChatOpenAI
+except ImportError:
+    raise ImportError(
+        'Could not import langchain_openai python package. '
+        'Please install it with `pip install langchain_openai`.',
+    )
+
+try:
+    from langchain_aws import ChatBedrockConverse
+except ImportError:
+    raise ImportError(
+        'Could not import langchain-aws python package. '
+        'Please install it with `pip install langchain-aws`.',
+    )
+
+import boto3
+from botocore import UNSIGNED
+from botocore.config import Config
+
+
+def SingleStoreChatFactoryDebugV1(
+    model_name: str,
+    api_key: Optional[Union[Optional[str], Callable[[], Optional[str]]]] = None,
+    streaming: bool = True,
+    http_client: Optional[httpx.Client] = None,
+    obo_token: Optional[Union[Optional[str], Callable[[], Optional[str]]]] = None,
+    obo_token_getter: Optional[Callable[[], Optional[str]]] = None,
+    base_url: Optional[str] = None,
+    hosting_platform: Optional[str] = None,
+    timeout: Optional[float] = None,
+    **kwargs: Any,
+) -> Union[ChatOpenAI, ChatBedrockConverse]:
+    """Return a chat model instance (ChatOpenAI or ChatBedrockConverse).
+
+    Parameters
+    ----------
+    model_name : str
+        Name of the model; also used to look up the inference API when
+        ``base_url`` or ``hosting_platform`` cannot be resolved.
+    api_key : str or callable, optional
+        Bearer token, or a zero-argument callable returning it. When omitted,
+        the ``SINGLESTOREDB_USER_TOKEN`` environment variable is read each
+        time the token is needed.
+    streaming : bool, optional
+        Forwarded as ``streaming`` to ChatOpenAI, or inverted into
+        ``disable_streaming`` for ChatBedrockConverse.
+    http_client : httpx.Client, optional
+        Only its ``timeout`` is read; the client itself is not passed on.
+    obo_token : str or callable, optional
+        Value for the ``X-S2-OBO`` header, or a zero-argument callable
+        returning it.
+    obo_token_getter : callable, optional
+        Takes precedence over ``obo_token`` when given.
+    base_url : str, optional
+        Inference endpoint URL. Defaults to the
+        ``SINGLESTOREDB_INFERENCE_API_BASE_URL`` environment variable.
+    hosting_platform : str, optional
+        ``'Amazon'`` selects the Bedrock path; anything else selects the
+        OpenAI-compatible path. Defaults to the
+        ``SINGLESTOREDB_INFERENCE_API_HOSTING_PLATFORM`` environment variable.
+    timeout : float, optional
+        Timeout in seconds; overrides any timeout taken from ``http_client``.
+    **kwargs : Any
+        Forwarded to the ``ChatOpenAI`` / ``ChatBedrockConverse`` constructor.
+
+    Returns
+    -------
+    ChatOpenAI or ChatBedrockConverse
+
+    """
+    # Normalize api_key / obo_token into zero-argument getters so a token
+    # can be re-read whenever it is needed instead of being captured once.
+    if callable(api_key):
+        api_key_getter_fn = api_key
+    else:
+        def api_key_getter_fn() -> Optional[str]:
+            if api_key is None:
+                return os.environ.get('SINGLESTOREDB_USER_TOKEN')
+            return api_key
+
+    if obo_token_getter is not None:
+        obo_token_getter_fn = obo_token_getter
+    elif callable(obo_token):
+        obo_token_getter_fn = obo_token
+    else:
+        def obo_token_getter_fn() -> Optional[str]:
+            return obo_token
+
+    # Resolve the endpoint: explicit arguments first, then environment
+    # variables, then a lookup through the management API.
+    if base_url is None:
+        base_url = os.environ.get('SINGLESTOREDB_INFERENCE_API_BASE_URL')
+    if hosting_platform is None:
+        hosting_platform = os.environ.get('SINGLESTOREDB_INFERENCE_API_HOSTING_PLATFORM')
+    if base_url is None or hosting_platform is None:
+        inference_api_manager = (
+            manage_workspaces().organizations.current.inference_apis
+        )
+        info = inference_api_manager.get(model_name=model_name)
+    else:
+        info = InferenceAPIInfo(
+            service_id='',
+            model_name=model_name,
+            name='',
+            connection_url=base_url,
+            project_id='',
+            hosting_platform=hosting_platform,
+        )
+    # A value that was supplied still wins over the looked-up one.
+    if base_url is not None:
+        info.connection_url = base_url
+    if hosting_platform is not None:
+        info.hosting_platform = hosting_platform
+
+    # Extract timeouts from http_client if provided
+    t = http_client.timeout if http_client is not None else None
+    connect_timeout = None
+    read_timeout = None
+    if isinstance(t, httpx.Timeout):
+        if t.connect is not None:
+            connect_timeout = float(t.connect)
+        if t.read is not None:
+            read_timeout = float(t.read)
+        # Fill whichever half is missing from the other one.
+        if connect_timeout is None:
+            connect_timeout = read_timeout
+        if read_timeout is None:
+            read_timeout = connect_timeout
+    elif isinstance(t, (int, float)):
+        connect_timeout = read_timeout = float(t)
+    if timeout is not None:
+        connect_timeout = timeout
+        read_timeout = timeout
+        t = httpx.Timeout(timeout)
+
+    if info.hosting_platform == 'Amazon':
+        # Requests are unsigned and the AWS credentials are placeholders;
+        # authentication is presumably carried by the headers injected below.
+        cfg_kwargs = {
+            'signature_version': UNSIGNED,
+            'retries': {'max_attempts': 1, 'mode': 'standard'},
+        }
+        if read_timeout is not None:
+            cfg_kwargs['read_timeout'] = read_timeout
+        if connect_timeout is not None:
+            cfg_kwargs['connect_timeout'] = connect_timeout
+
+        client = boto3.client(
+            'bedrock-runtime',
+            endpoint_url=info.connection_url,
+            region_name='us-east-1',
+            aws_access_key_id='placeholder',
+            aws_secret_access_key='placeholder',
+            config=Config(**cfg_kwargs),
+        )
+
+        def _inject_headers(request: Any, **_ignored: Any) -> None:
+            """Inject dynamic auth/OBO headers prior to Bedrock sending."""
+            token_val = api_key_getter_fn()
+            if token_val:
+                request.headers['Authorization'] = f'Bearer {token_val}'
+            obo_val = obo_token_getter_fn()
+            if obo_val:
+                request.headers['X-S2-OBO'] = obo_val
+            request.headers.pop('X-Amz-Date', None)
+            request.headers.pop('X-Amz-Security-Token', None)
+
+        # Hook through the public client.meta.events emitter rather than the
+        # private client._endpoint._event_emitter attribute.
+        for operation in (
+            'Converse',
+            'ConverseStream',
+            'InvokeModel',
+            'InvokeModelWithResponseStream',
+        ):
+            client.meta.events.register_first(
+                f'before-send.bedrock-runtime.{operation}',
+                _inject_headers,
+            )
+
+        return ChatBedrockConverse(
+            model_id=model_name,
+            endpoint_url=info.connection_url,
+            region_name='us-east-1',
+            aws_access_key_id='placeholder',
+            aws_secret_access_key='placeholder',
+            disable_streaming=not streaming,
+            client=client,
+            **kwargs,
+        )
+
+    # OpenAI / Azure OpenAI path
+    if t is None:
+        t = httpx.Timeout(timeout=600, connect=5.0)  # default OpenAI timeout
+    http_client_internal = httpx.Client(
+        timeout=t,
+        auth=SingleStoreOpenAIAuth(obo_token_getter_fn),
+    )
+
+    # NOTE(review): unlike the Bedrock path, the API key is read once here.
+    return ChatOpenAI(
+        base_url=info.connection_url,
+        api_key=api_key_getter_fn(),
+        model=model_name,
+        streaming=streaming,
+        http_client=http_client_internal,
+        **kwargs,
+    )
diff --git a/singlestoredb/ai/utils.py b/singlestoredb/ai/utils.py
@@ -0,0 +1,41 @@
+import logging
+from typing import Callable
+from typing import Generator
+from typing import Optional
+
+import httpx
+
+logger = logging.getLogger(__name__)
+
+
+class SingleStoreOpenAIAuth(httpx.Auth):
+    """httpx auth hook that adds an ``X-S2-OBO`` header to each request.
+
+    The token getter is called inside ``auth_flow``, so a callable that
+    returns a refreshed token takes effect without rebuilding the client.
+    """
+
+    def __init__(
+        self,
+        obo_token_getter: Optional[Callable[[], Optional[str]]],
+    ) -> None:
+        self.obo_token_getter_fn = obo_token_getter
+
+    def auth_flow(
+        self,
+        request: httpx.Request,
+    ) -> Generator[httpx.Request, httpx.Response, None]:
+        """Set ``X-S2-OBO`` when the getter returns a token, then yield."""
+        # Lazy %-style arguments: the URL is only formatted if INFO is enabled.
+        logger.info('auth_flow called for request to %s', request.url)
+        if self.obo_token_getter_fn is not None:
+            logger.debug('obo_token_getter_fn is set, attempting to get token')
+            obo_val = self.obo_token_getter_fn()
+            if obo_val:
+                logger.info('OBO token retrieved successfully, adding X-S2-OBO header')
+                request.headers['X-S2-OBO'] = obo_val
+            else:
+                logger.warning('obo_token_getter_fn returned empty/None value')
+        else:
+            logger.debug('obo_token_getter_fn is None, skipping OBO token')
+        yield request

Original file line number	Diff line number	Diff line change
`@@ -1,2 +1,3 @@`
`1`	`1`	`from .chat import SingleStoreChatFactory # noqa: F401`
	`2`	`+from .debugv1 import SingleStoreChatFactoryDebugV1 # noqa: F401`
`2`	`3`	`from .embeddings import SingleStoreEmbeddingsFactory # noqa: F401`