chore: initial public snapshot for github upload

2026-03-26 20:06:14 +08:00
commit 0e5ecd930e
3497 changed files with 1586236 additions and 0 deletions
--- a/llm-gateway-competitors/litellm-wheel-src/litellm/llms/base_llm/ocr/__init__.py
+++ b/llm-gateway-competitors/litellm-wheel-src/litellm/llms/base_llm/ocr/__init__.py
@@ -0,0 +1,22 @@
+"""Base OCR transformation module."""
+from .transformation import (
+    BaseOCRConfig,
+    DocumentType,
+    OCRPage,
+    OCRPageDimensions,
+    OCRPageImage,
+    OCRRequestData,
+    OCRResponse,
+    OCRUsageInfo,
+)
+
+__all__ = [  # public API: exactly the names imported from .transformation above
+    "BaseOCRConfig",
+    "DocumentType",
+    "OCRResponse",
+    "OCRPage",
+    "OCRPageDimensions",
+    "OCRPageImage",
+    "OCRUsageInfo",
+    "OCRRequestData",
+]
--- a/llm-gateway-competitors/litellm-wheel-src/litellm/llms/base_llm/ocr/transformation.py
+++ b/llm-gateway-competitors/litellm-wheel-src/litellm/llms/base_llm/ocr/transformation.py
@@ -0,0 +1,258 @@
+"""
+Base OCR transformation configuration.
+"""
+from typing import TYPE_CHECKING, Any, Dict, List, Optional, Union
+
+import httpx
+from pydantic import PrivateAttr
+
+from litellm.llms.base_llm.chat.transformation import BaseLLMException
+from litellm.types.llms.base import LiteLLMPydanticObjectBase
+
+if TYPE_CHECKING:
+    from litellm.litellm_core_utils.litellm_logging import Logging as LiteLLMLoggingObj
+else:
+    LiteLLMLoggingObj = Any
+
+
+# DocumentType for OCR: the dict every provider transform receives. Keys and
+# values are all str, and "type" is either "document_url" or "image_url".
+# File-type inputs are converted to this shape beforehand in litellm/ocr/main.py.
+DocumentType = Dict[str, str]
+
+
+class OCRPageDimensions(LiteLLMPydanticObjectBase):
+    """Page dimensions from an OCR response; every field defaults to None."""
+
+    dpi: Optional[int] = None
+    height: Optional[int] = None  # NOTE(review): unit not stated here (pixels?) - confirm
+    width: Optional[int] = None  # NOTE(review): presumably same unit as height - confirm
+
+
+class OCRPageImage(LiteLLMPydanticObjectBase):
+    """Image extracted from an OCR page; both declared fields default to None."""
+
+    image_base64: Optional[str] = None
+    bbox: Optional[Dict[str, Any]] = None  # NOTE(review): key schema is not defined here
+
+    model_config = {"extra": "allow"}  # pydantic: keep undeclared fields on the model
+
+
+class OCRPage(LiteLLMPydanticObjectBase):
+    """Single page from an OCR response; index and markdown are required."""
+
+    index: int
+    markdown: str
+    images: Optional[List[OCRPageImage]] = None
+    dimensions: Optional[OCRPageDimensions] = None
+
+    model_config = {"extra": "allow"}  # pydantic: keep undeclared fields on the model
+
+
+class OCRUsageInfo(LiteLLMPydanticObjectBase):
+    """Usage information from an OCR response; both declared fields default to None."""
+
+    pages_processed: Optional[int] = None
+    doc_size_bytes: Optional[int] = None
+
+    model_config = {"extra": "allow"}  # pydantic: keep undeclared fields on the model
+
+
+class OCRResponse(LiteLLMPydanticObjectBase):
+    """
+    Standard OCR response format; pages and model are required.
+    Standardized to Mistral OCR format - other providers should transform to this format.
+    """
+
+    pages: List[OCRPage]
+    model: str
+    document_annotation: Optional[Any] = None
+    usage_info: Optional[OCRUsageInfo] = None
+    object: str = "ocr"
+
+    model_config = {"extra": "allow"}  # pydantic: keep undeclared fields on the model
+
+    # Private attribute (not a model field); default_factory gives each instance its own dict
+    _hidden_params: dict = PrivateAttr(default_factory=dict)
+
+
+class OCRRequestData(LiteLLMPydanticObjectBase):
+    """OCR request data returned by the request transforms; fields default to None."""
+
+    data: Optional[Union[Dict, bytes]] = None
+    files: Optional[Dict[str, Any]] = None
+
+
+class BaseOCRConfig:
+    """
+    Base class for provider OCR configs: trivial defaults for params/headers;
+    URL and sync request/response transforms raise NotImplementedError here.
+    """
+
+    def __init__(self) -> None:
+        pass  # the base config keeps no instance state
+
+    def get_supported_ocr_params(self, model: str) -> list:
+        """
+        Return the OCR parameters this provider supports for `model`.
+        The base implementation returns an empty list; providers override it.
+        """
+        return []
+
+    def map_ocr_params(
+        self,
+        non_default_params: dict,
+        optional_params: dict,
+        model: str,
+    ) -> dict:
+        """Map OCR params to provider params; the base returns optional_params."""
+        return optional_params  # non_default_params and model are unused here
+
+    def validate_environment(
+        self,
+        headers: Dict,
+        model: str,
+        api_key: Optional[str] = None,
+        api_base: Optional[str] = None,
+        litellm_params: Optional[dict] = None,
+        **kwargs,
+    ) -> Dict:
+        """
+        Return the request headers; the base does no validation and returns
+        `headers` unchanged. Override in provider-specific implementations.
+        """
+        return headers
+
+    def get_complete_url(
+        self,
+        api_base: Optional[str],
+        model: str,
+        optional_params: dict,
+        litellm_params: Optional[dict] = None,
+        **kwargs,
+    ) -> str:
+        """
+        Get complete URL for the OCR endpoint.
+        Must be overridden: the base implementation raises NotImplementedError.
+        """
+        raise NotImplementedError("get_complete_url must be implemented by provider")
+
+    def transform_ocr_request(
+        self,
+        model: str,
+        document: DocumentType,
+        optional_params: dict,
+        headers: dict,
+        **kwargs,
+    ) -> OCRRequestData:
+        """
+        Transform OCR request to provider-specific format.
+        Must be overridden: the base implementation raises NotImplementedError.
+
+        Note: By the time this method is called, any file-type documents have already
+        been converted to document_url/image_url format with base64 data URIs by
+        the preprocessing in litellm/ocr/main.py.
+
+        Args:
+            model: Model name
+            document: Document to process - always a dict with type="document_url" or type="image_url"
+            optional_params: Optional parameters for the request
+            headers: Request headers
+
+        Returns:
+            OCRRequestData with data and files fields
+        """
+        raise NotImplementedError(
+            "transform_ocr_request must be implemented by provider"
+        )
+
+    async def async_transform_ocr_request(
+        self,
+        model: str,
+        document: DocumentType,
+        optional_params: dict,
+        headers: dict,
+        **kwargs,
+    ) -> OCRRequestData:
+        """
+        Async transform OCR request to provider-specific format.
+        Optional method - providers can override if they need async transformations
+        (e.g., Azure AI for URL-to-base64 conversion).
+
+        Default implementation falls back to sync transform_ocr_request.
+
+        Args:
+            model: Model name
+            document: Document to process - always a dict with type="document_url" or type="image_url"
+            optional_params: Optional parameters for the request
+            headers: Request headers
+
+        Returns:
+            OCRRequestData with data and files fields
+        """
+        # Default implementation: delegate to the sync version (called inline, not awaited)
+        return self.transform_ocr_request(
+            model=model,
+            document=document,
+            optional_params=optional_params,
+            headers=headers,
+            **kwargs,
+        )
+
+    def transform_ocr_response(
+        self,
+        model: str,
+        raw_response: httpx.Response,
+        logging_obj: LiteLLMLoggingObj,
+        **kwargs,
+    ) -> OCRResponse:
+        """
+        Transform provider-specific OCR response to standard format.
+        Must be overridden: the base implementation raises NotImplementedError.
+        """
+        raise NotImplementedError(
+            "transform_ocr_response must be implemented by provider"
+        )
+
+    async def async_transform_ocr_response(
+        self,
+        model: str,
+        raw_response: httpx.Response,
+        logging_obj: LiteLLMLoggingObj,
+        **kwargs,
+    ) -> OCRResponse:
+        """
+        Async transform provider-specific OCR response to standard format.
+        Optional method - providers can override if they need async transformations
+        (e.g., Azure Document Intelligence for async operation polling).
+
+        Default implementation falls back to sync transform_ocr_response.
+
+        Args:
+            model: Model name
+            raw_response: Raw HTTP response
+            logging_obj: Logging object
+
+        Returns:
+            OCRResponse in standard format
+        """
+        # Default implementation: delegate to the sync version (called inline, not awaited)
+        return self.transform_ocr_response(
+            model=model,
+            raw_response=raw_response,
+            logging_obj=logging_obj,
+            **kwargs,
+        )
+
+    def get_error_class(
+        self,
+        error_message: str,
+        status_code: int,
+        headers: dict,
+    ) -> Exception:
+        """Build the provider error; the base returns a BaseLLMException instance."""
+        return BaseLLMException(
+            status_code=status_code,
+            message=error_message,
+            headers=headers,
+        )