[Feat] Add Isaacus embeddings provider

adlumal · adlumal · commit 7d256214e5b1 · 2025-10-24T17:06:43.000+11:00
diff --git a/docs/my-website/docs/embedding/supported_embedding.md b/docs/my-website/docs/embedding/supported_embedding.md
@@ -543,9 +543,56 @@ All models listed here https://docs.voyageai.com/embeddings/#models-and-specific
 
 | Model Name               | Function Call                                                                                                                                                      |
 |--------------------------|------------------------------------------------------------------------------------------------------------------------------------------------------------------|
-| voyage-01 | `embedding(model="voyage/voyage-01", input)` | 
-| voyage-lite-01 | `embedding(model="voyage/voyage-lite-01", input)` | 
-| voyage-lite-01-instruct | `embedding(model="voyage/voyage-lite-01-instruct", input)` | 
+| voyage-01 | `embedding(model="voyage/voyage-01", input)` |
+| voyage-lite-01 | `embedding(model="voyage/voyage-lite-01", input)` |
+| voyage-lite-01-instruct | `embedding(model="voyage/voyage-lite-01-instruct", input)` |
+
+## Isaacus AI Embedding Models
+
+### Usage - Embedding
+```python
+from litellm import embedding
+import os
+
+os.environ['ISAACUS_API_KEY'] = ""
+response = embedding(
+    model="isaacus/kanon-2-embedder",
+    input=["good morning from litellm"],
+)
+print(response)
+```
+
+### Supported Models
+All models listed at https://docs.isaacus.com/api-reference/embeddings are supported.
+
+| Model Name | Function Call |
+|------------|---------------|
+| kanon-2-embedder | `embedding(model="isaacus/kanon-2-embedder", input)` |
+
+**Supported optional params:**
+- `task` - Optimize embeddings for specific use case: `"retrieval/query"` (for search queries) or `"retrieval/document"` (for documents to be indexed)
+- `dimensions` - Optionally reduce embedding dimensionality (e.g., 256, 768, 1024)
+- `overflow_strategy` - How to handle text that exceeds model limits: `"drop_end"` (default, truncates text at the end)
+
+```python
+# Example with optional params
+response = embedding(
+    model="isaacus/kanon-2-embedder",
+    input=["contract text"],
+    task="retrieval/query",  # or "retrieval/document"
+    dimensions=1024,
+    overflow_strategy="drop_end"
+)
+```
+
+### Task Parameter
+
+Isaacus embeddings support task-specific optimization to improve retrieval accuracy. Set the `task` parameter based on your use case:
+
+- `"retrieval/query"` – for embedding search queries during retrieval
+- `"retrieval/document"` – for embedding documents during indexing
+
+> **Note:** Using the correct task type ensures optimal performance for legal document retrieval.
 
 ### Provider-specific Params
 
diff --git a/litellm/__init__.py b/litellm/__init__.py
@@ -68,6 +68,7 @@
     open_ai_embedding_models,
     cohere_embedding_models,
     bedrock_embedding_models,
+    isaacus_embedding_models,
     known_tokenizer_config,
     BEDROCK_INVOKE_PROVIDERS_LITERAL,
     BEDROCK_EMBEDDING_PROVIDERS_LITERAL,
@@ -234,6 +235,7 @@
 datarobot_key: Optional[str] = None
 predibase_key: Optional[str] = None
 huggingface_key: Optional[str] = None
+isaacus_key: Optional[str] = None
 vertex_project: Optional[str] = None
 vertex_location: Optional[str] = None
 predibase_tenant_id: Optional[str] = None
@@ -1192,6 +1194,7 @@ def add_known_models():
     VoyageContextualEmbeddingConfig,
 )
 from .llms.infinity.embedding.transformation import InfinityEmbeddingConfig
+from .llms.isaacus.embedding.transformation import IsaacusEmbeddingConfig
 from .llms.azure_ai.chat.transformation import AzureAIStudioConfig
 from .llms.mistral.chat.transformation import MistralConfig
 from .llms.openai.responses.transformation import OpenAIResponsesAPIConfig
diff --git a/litellm/constants.py b/litellm/constants.py
@@ -895,6 +895,11 @@
         "twelvelabs.marengo-embed-2-7-v1:0",
     ]
 )
+# Isaacus embedding model names. get_llm_provider routes a bare model name
+# found in this set to the "isaacus" provider.
+isaacus_embedding_models: set = set(
+    [
+        "kanon-2-embedder",
+    ]
+)
 
 known_tokenizer_config = {
     "mistralai/Mistral-7B-Instruct-v0.1": {
diff --git a/litellm/litellm_core_utils/get_llm_provider_logic.py b/litellm/litellm_core_utils/get_llm_provider_logic.py
@@ -372,6 +372,12 @@ def get_llm_provider(  # noqa: PLR0915
             custom_llm_provider = "lemonade"
         elif model.startswith("heroku/"):
             custom_llm_provider = "heroku"
+        # isaacus models
+        elif (
+            model.startswith("isaacus/")
+            or model in litellm.isaacus_embedding_models
+        ):
+            custom_llm_provider = "isaacus"
         # cometapi models
         elif model.startswith("cometapi/"):
             custom_llm_provider = "cometapi"
diff --git a/litellm/llms/isaacus/__init__.py b/litellm/llms/isaacus/__init__.py
@@ -0,0 +1 @@
+"""Isaacus LLM Provider."""
diff --git a/litellm/llms/isaacus/embedding/__init__.py b/litellm/llms/isaacus/embedding/__init__.py
@@ -0,0 +1,3 @@
+from .transformation import IsaacusEmbeddingConfig, IsaacusError
+
+__all__ = ["IsaacusEmbeddingConfig", "IsaacusError"]
diff --git a/litellm/llms/isaacus/embedding/transformation.py b/litellm/llms/isaacus/embedding/transformation.py
@@ -0,0 +1,196 @@
+"""
+Transformation logic from OpenAI /v1/embeddings format to Isaacus's /v1/embeddings format.
+
+Reference: https://docs.isaacus.com/api-reference/embeddings
+"""
+
+from typing import List, Optional, Union, cast
+
+import httpx
+
+from litellm.litellm_core_utils.litellm_logging import Logging as LiteLLMLoggingObj
+from litellm.llms.base_llm.chat.transformation import BaseLLMException
+from litellm.llms.base_llm.embedding.transformation import BaseEmbeddingConfig
+from litellm.secret_managers.main import get_secret_str
+from litellm.types.llms.openai import AllEmbeddingInputValues, AllMessageValues
+from litellm.types.utils import EmbeddingResponse, Usage
+
+
+class IsaacusError(BaseLLMException):
+    """Exception raised for failed or unparseable Isaacus embeddings responses.
+
+    Args:
+        status_code: HTTP status code associated with the failure.
+        message: Error text to surface to the caller.
+        headers: Response headers, if any. A fresh empty dict is used when
+            omitted.
+    """
+
+    def __init__(
+        self,
+        status_code: int,
+        message: str,
+        headers: Optional[Union[dict, httpx.Headers]] = None,
+    ):
+        # Build a new dict per call rather than sharing one mutable default
+        # object across every IsaacusError instance.
+        if headers is None:
+            headers = {}
+        self.status_code = status_code
+        self.message = message
+        # Placeholder request/response objects attached to the exception.
+        self.request = httpx.Request(
+            method="POST", url="https://api.isaacus.com/v1/embeddings"
+        )
+        self.response = httpx.Response(status_code=status_code, request=self.request)
+        # NOTE(review): confirm BaseLLMException.__init__ does not replace the
+        # request/response set above when they are not passed through.
+        super().__init__(
+            status_code=status_code,
+            message=message,
+            headers=headers,
+        )
+
+
+class IsaacusEmbeddingConfig(BaseEmbeddingConfig):
+    """
+    Reference: https://docs.isaacus.com/api-reference/embeddings
+
+    The Isaacus embeddings API provides access to the Kanon 2 Embedder for law.
+    """
+
+    def __init__(self) -> None:
+        """Create the config; no instance state is set up here."""
+        return None
+
+    def get_complete_url(
+        self,
+        api_base: Optional[str],
+        api_key: Optional[str],
+        model: str,
+        optional_params: dict,
+        litellm_params: dict,
+        stream: Optional[bool] = None,
+    ) -> str:
+        """Return the embeddings endpoint URL to call.
+
+        Args:
+            api_base: Optional base URL override. When empty or None the
+                public Isaacus endpoint is used.
+            api_key: Unused here.
+            model: Unused here.
+            optional_params: Unused here.
+            litellm_params: Unused here.
+            stream: Unused here.
+
+        Returns:
+            A URL ending in ``/embeddings`` with no trailing slash.
+        """
+        if not api_base:
+            return "https://api.isaacus.com/v1/embeddings"
+
+        # Drop trailing slashes first so ".../v1/" does not turn into
+        # ".../v1//embeddings" and ".../embeddings/" is still recognised as
+        # already complete.
+        base = api_base.rstrip("/")
+        if base.endswith("/embeddings"):
+            return base
+        return f"{base}/embeddings"
+
+    def get_supported_openai_params(self, model: str) -> list:
+        """List the OpenAI embedding params this config accepts (only ``dimensions``)."""
+        supported_params = ["dimensions"]
+        return supported_params
+
+    def map_openai_params(
+        self,
+        non_default_params: dict,
+        optional_params: dict,
+        model: str,
+        drop_params: bool,
+    ) -> dict:
+        """
+        Copy the supported OpenAI params into the Isaacus request params.
+
+        Only ``dimensions`` is carried over; ``optional_params`` is updated in
+        place and also returned.
+
+        Reference: https://docs.isaacus.com/api-reference/embeddings
+        """
+        # Nothing to map when the caller did not set `dimensions`.
+        if "dimensions" not in non_default_params:
+            return optional_params
+
+        requested_dimensions = non_default_params["dimensions"]
+        optional_params["dimensions"] = requested_dimensions
+        return optional_params
+
+    def validate_environment(
+        self,
+        headers: dict,
+        model: str,
+        messages: List[AllMessageValues],
+        optional_params: dict,
+        litellm_params: dict,
+        api_key: Optional[str] = None,
+        api_base: Optional[str] = None,
+    ) -> dict:
+        """Build the HTTP headers for an Isaacus request.
+
+        When ``api_key`` is None the key is looked up via
+        ``get_secret_str("ISAACUS_API_KEY")``. The incoming ``headers`` dict is
+        not read; a new dict with bearer auth and a JSON content type is
+        returned.
+        """
+        resolved_key = (
+            api_key if api_key is not None else get_secret_str("ISAACUS_API_KEY")
+        )
+        request_headers = {}
+        request_headers["Authorization"] = f"Bearer {resolved_key}"
+        request_headers["Content-Type"] = "application/json"
+        return request_headers
+
+    def transform_embedding_request(
+        self,
+        model: str,
+        input: AllEmbeddingInputValues,
+        optional_params: dict,
+        headers: dict,
+    ) -> dict:
+        """
+        Transform OpenAI-style embedding request to Isaacus format.
+
+        OpenAI uses 'input' while Isaacus uses 'texts'.
+
+        Args:
+            model: Model name placed in the request body as-is.
+            input: A single string or a list of strings.
+            optional_params: May contain ``task``, ``overflow_strategy`` and
+                ``dimensions``; other keys are ignored.
+            headers: Unused here.
+
+        Returns:
+            The JSON-serialisable request body.
+
+        Raises:
+            ValueError: If any list element is a token id or a token array.
+        """
+        if isinstance(input, str):
+            texts = [input]
+        elif isinstance(input, list):
+            # Check every element, not only the first, so a mixed list such as
+            # ["text", [1, 2]] is rejected here rather than sent to the API.
+            if any(isinstance(item, (list, int)) for item in input):
+                raise ValueError(
+                    "Isaacus does not support token array inputs. Input must be a string or list of strings."
+                )
+            texts = cast(List[str], input)
+        else:
+            texts = [input]
+
+        request_data: dict = {
+            "model": model,
+            "texts": texts,
+        }
+
+        # Forward only the parameters this method knows about, and only when
+        # the caller actually set them.
+        for param_name in ("task", "overflow_strategy", "dimensions"):
+            if param_name in optional_params:
+                request_data[param_name] = optional_params[param_name]
+
+        return request_data
+
+    def transform_embedding_response(
+        self,
+        model: str,
+        raw_response: httpx.Response,
+        model_response: EmbeddingResponse,
+        logging_obj: LiteLLMLoggingObj,
+        api_key: Optional[str] = None,
+        request_data: dict = {},
+        optional_params: dict = {},
+        litellm_params: dict = {},
+    ) -> EmbeddingResponse:
+        """Convert an Isaacus embeddings response into the OpenAI-style shape.
+
+        Isaacus format:
+            {"embeddings": [{"embedding": [...], "index": 0}, ...],
+             "usage": {"input_tokens": 10}}
+        OpenAI format:
+            {"data": [{"embedding": [...], "index": 0, "object": "embedding"}],
+             "model": "...", "usage": {...}}
+
+        Args:
+            model: Model name copied onto the response.
+            raw_response: HTTP response whose body is parsed as JSON.
+            model_response: Response object that is filled in and returned.
+            logging_obj, api_key, request_data, optional_params,
+                litellm_params: Unused here. The dict defaults are never
+                mutated by this method.
+
+        Returns:
+            ``model_response`` with ``model``, ``data``, ``object`` and
+            ``usage`` set.
+
+        Raises:
+            IsaacusError: If the response body cannot be parsed as JSON.
+        """
+        try:
+            raw_response_json = raw_response.json()
+        except Exception as err:
+            # Keep the parse failure as the cause so it is visible in tracebacks.
+            raise IsaacusError(
+                message=raw_response.text, status_code=raw_response.status_code
+            ) from err
+
+        # `or []` also covers an explicit null in the payload.
+        embeddings_data = raw_response_json.get("embeddings") or []
+
+        # Fall back to the list position when an item has no "index", so that
+        # items never all collapse onto index 0.
+        output_data = [
+            {
+                "object": "embedding",
+                "index": emb_obj.get("index", position),
+                "embedding": emb_obj.get("embedding", []),
+            }
+            for position, emb_obj in enumerate(embeddings_data)
+        ]
+
+        model_response.model = model
+        model_response.data = output_data
+        model_response.object = "list"
+
+        # Isaacus reports usage as "input_tokens"; a missing or null value
+        # counts as 0.
+        usage_data = raw_response_json.get("usage") or {}
+        input_tokens = usage_data.get("input_tokens") or 0
+
+        model_response.usage = Usage(
+            prompt_tokens=input_tokens,
+            total_tokens=input_tokens,
+        )
+
+        return model_response
+
+    def get_error_class(
+        self, error_message: str, status_code: int, headers: Union[dict, httpx.Headers]
+    ) -> BaseLLMException:
+        """Wrap an error message, status code and headers in an IsaacusError."""
+        isaacus_error = IsaacusError(
+            status_code=status_code,
+            message=error_message,
+            headers=headers,
+        )
+        return isaacus_error
diff --git a/litellm/main.py b/litellm/main.py
@@ -4579,6 +4579,24 @@ def embedding(  # noqa: PLR0915
                 aembedding=aembedding,
                 litellm_params={},
             )
+        elif custom_llm_provider == "isaacus":
+            api_key = (
+                api_key or litellm.isaacus_key or get_secret_str("ISAACUS_API_KEY")
+            )
+            response = base_llm_http_handler.embedding(
+                model=model,
+                input=input,
+                custom_llm_provider=custom_llm_provider,
+                api_base=api_base,
+                api_key=api_key,
+                logging_obj=logging,
+                timeout=timeout,
+                model_response=EmbeddingResponse(),
+                optional_params=optional_params,
+                client=client,
+                aembedding=aembedding,
+                litellm_params={},
+            )
         elif custom_llm_provider == "watsonx":
             credentials = IBMWatsonXMixin.get_watsonx_credentials(
                 optional_params=optional_params, api_key=api_key, api_base=api_base
diff --git a/litellm/types/utils.py b/litellm/types/utils.py
@@ -2510,6 +2510,7 @@ class LlmProviders(str, Enum):
     GALADRIEL = "galadriel"
     NEBIUS = "nebius"
     INFINITY = "infinity"
+    ISAACUS = "isaacus"
     DEEPGRAM = "deepgram"
     ELEVENLABS = "elevenlabs"
     NOVITA = "novita"
diff --git a/litellm/utils.py b/litellm/utils.py
@@ -7219,6 +7219,8 @@ def get_provider_embedding_config(
             return litellm.IBMWatsonXEmbeddingConfig()
         elif litellm.LlmProviders.INFINITY == provider:
             return litellm.InfinityEmbeddingConfig()
+        elif litellm.LlmProviders.ISAACUS == provider:
+            return litellm.IsaacusEmbeddingConfig()
         elif litellm.LlmProviders.SAMBANOVA == provider:
             return litellm.SambaNovaEmbeddingConfig()
         elif (
diff --git a/tests/llm_translation/test_isaacus_embedding.py b/tests/llm_translation/test_isaacus_embedding.py
diff --git a/tests/test_litellm/llms/isaacus/embedding/__init__.py b/tests/test_litellm/llms/isaacus/embedding/__init__.py
diff --git a/tests/test_litellm/llms/isaacus/embedding/test_transformation.py b/tests/test_litellm/llms/isaacus/embedding/test_transformation.py

Original file line number	Diff line number	Diff line change
`@@ -895,6 +895,11 @@`
`895`	`895`	`"twelvelabs.marengo-embed-2-7-v1:0",`
`896`	`896`	`]`
`897`	`897`	`)`
	`898`	`+isaacus_embedding_models: set = set(`
	`899`	`+ [`
	`900`	`+ "kanon-2-embedder",`
	`901`	`+ ]`
	`902`	`+)`
`898`	`903`
`899`	`904`	`known_tokenizer_config = {`
`900`	`905`	`"mistralai/Mistral-7B-Instruct-v0.1": {`
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+from .transformation import IsaacusEmbeddingConfig, IsaacusError`
	`2`	`+`
	`3`	`+__all__ = ["IsaacusEmbeddingConfig", "IsaacusError"]`