chore: initial public snapshot for github upload
@@ -0,0 +1,42 @@
from typing import TYPE_CHECKING

import litellm
from litellm.proxy.guardrails.guardrail_hooks.openai.moderations import (
    OpenAIModerationGuardrail,
)
from litellm.types.guardrails import SupportedGuardrailIntegrations

if TYPE_CHECKING:
    from litellm.types.guardrails import Guardrail, LitellmParams


def initialize_guardrail(litellm_params: "LitellmParams", guardrail: "Guardrail"):
    guardrail_name = guardrail.get("guardrail_name")
    if not guardrail_name:
        raise ValueError("OpenAI Moderation: guardrail_name is required")

    openai_moderation_guardrail = OpenAIModerationGuardrail(
        guardrail_name=guardrail_name,
        **{
            **litellm_params.model_dump(exclude_none=True),
            "api_key": litellm_params.api_key,
            "api_base": litellm_params.api_base,
            "default_on": litellm_params.default_on,
            "event_hook": litellm_params.mode,
            "model": litellm_params.model,
        },
    )

    litellm.logging_callback_manager.add_litellm_callback(openai_moderation_guardrail)

    return openai_moderation_guardrail


guardrail_initializer_registry = {
    SupportedGuardrailIntegrations.OPENAI_MODERATION.value: initialize_guardrail,
}


guardrail_class_registry = {
    SupportedGuardrailIntegrations.OPENAI_MODERATION.value: OpenAIModerationGuardrail,
}
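A minimal sketch of how this registry might be exercised when the proxy loads guardrails from its config. The exact LitellmParams constructor fields and the shape of the Guardrail mapping are assumptions for illustration, not taken from this commit:

    from litellm.types.guardrails import LitellmParams, SupportedGuardrailIntegrations

    # Hypothetical config values; in the proxy these come from the guardrails config.
    litellm_params = LitellmParams(
        guardrail="openai_moderation",  # assumed field name
        mode="pre_call",                # forwarded as event_hook above
        model="omni-moderation-latest",
        default_on=True,
    )
    guardrail_spec = {"guardrail_name": "openai-mod"}  # Guardrail is used as a mapping above

    initializer = guardrail_initializer_registry[
        SupportedGuardrailIntegrations.OPENAI_MODERATION.value
    ]
    moderation_guardrail = initializer(litellm_params, guardrail_spec)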
@@ -0,0 +1,52 @@
from typing import TYPE_CHECKING, List, Optional

if TYPE_CHECKING:
    from litellm.types.llms.openai import AllMessageValues


class OpenAIGuardrailBase:
    """
    Base class for OpenAI guardrails.
    """

    def get_user_prompt(self, messages: List["AllMessageValues"]) -> Optional[str]:
        """
        Get the last consecutive block of messages from the user.

        Example:
            messages = [
                {"role": "user", "content": "Hello, how are you?"},
                {"role": "assistant", "content": "I'm good, thank you!"},
                {"role": "user", "content": "What is the weather in Tokyo?"},
            ]
            get_user_prompt(messages) -> "What is the weather in Tokyo?"
        """
        from litellm.litellm_core_utils.prompt_templates.common_utils import (
            convert_content_list_to_str,
        )

        if not messages:
            return None

        # Iterate from the end to find the last consecutive block of user messages
        user_messages = []
        for message in reversed(messages):
            if message.get("role") == "user":
                user_messages.append(message)
            else:
                # Stop when we hit a non-user message
                break

        if not user_messages:
            return None

        # Reverse to get the messages in chronological order
        user_messages.reverse()

        user_prompt = ""
        for message in user_messages:
            text_content = convert_content_list_to_str(message)
            user_prompt += text_content + "\n"

        result = user_prompt.strip()
        return result if result else None
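A short usage sketch of the "last consecutive block" behavior implemented above: only the trailing run of user messages is collected, and their text content is joined with newlines. This is illustration only, not part of the commit:

    base = OpenAIGuardrailBase()
    messages = [
        {"role": "user", "content": "Summarize this thread."},
        {"role": "assistant", "content": "Sure - which thread?"},
        {"role": "user", "content": "The deployment incident thread."},
        {"role": "user", "content": "Focus on the rollback steps."},
    ]
    # Only the last two user messages form the consecutive block, so this prints:
    # "The deployment incident thread.\nFocus on the rollback steps."
    print(base.get_user_prompt(messages))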
@@ -0,0 +1,241 @@
#!/usr/bin/env python3
"""
OpenAI Moderation Guardrail Integration for LiteLLM
"""

from typing import (
    TYPE_CHECKING,
    Literal,
    Optional,
    Type,
)

from fastapi import HTTPException

from litellm._logging import verbose_proxy_logger
from litellm.integrations.custom_guardrail import (
    CustomGuardrail,
    log_guardrail_information,
)
from litellm.litellm_core_utils.litellm_logging import Logging as LiteLLMLoggingObj
from litellm.llms.custom_httpx.http_handler import (
    get_async_httpx_client,
    httpxSpecialProvider,
)
from litellm.types.utils import GenericGuardrailAPIInputs

from .base import OpenAIGuardrailBase

if TYPE_CHECKING:
    from litellm.types.llms.openai import OpenAIModerationResponse
    from litellm.types.proxy.guardrails.guardrail_hooks.base import GuardrailConfigModel


class OpenAIModerationGuardrail(OpenAIGuardrailBase, CustomGuardrail):
    """
    LiteLLM Built-in Guardrail for OpenAI Content Moderation.

    This guardrail scans prompts and responses using the OpenAI Moderation API to detect
    harmful content, including violence, hate, harassment, self-harm, sexual content, etc.

    Configuration:
        guardrail_name: Name of the guardrail instance
        api_key: OpenAI API key
        api_base: OpenAI API endpoint
        model: OpenAI moderation model to use
        default_on: Whether to enable by default
    """

    def __init__(
        self,
        guardrail_name: str,
        api_key: Optional[str] = None,
        api_base: Optional[str] = None,
        model: Optional[
            Literal["omni-moderation-latest", "text-moderation-latest"]
        ] = None,
        **kwargs,
    ):
        """Initialize OpenAI Moderation guardrail handler."""
        from litellm.types.guardrails import GuardrailEventHooks

        # Initialize parent CustomGuardrail
        supported_event_hooks = [
            GuardrailEventHooks.pre_call,
            GuardrailEventHooks.during_call,
            GuardrailEventHooks.post_call,
        ]
        super().__init__(
            guardrail_name=guardrail_name,
            supported_event_hooks=supported_event_hooks,
            **kwargs,
        )

        self.async_handler = get_async_httpx_client(
            llm_provider=httpxSpecialProvider.GuardrailCallback
        )

        # Store configuration
        self.api_key = api_key or self._get_api_key()
        self.api_base = api_base or "https://api.openai.com/v1"
        self.model: Literal["omni-moderation-latest", "text-moderation-latest"] = (
            model or "omni-moderation-latest"
        )

        if not self.api_key:
            raise ValueError(
                "OpenAI Moderation: api_key is required. Set OPENAI_API_KEY environment variable or pass it in configuration."
            )

        verbose_proxy_logger.debug(
            f"Initialized OpenAI Moderation Guardrail: {guardrail_name} with model: {self.model}"
        )

    def _get_api_key(self) -> Optional[str]:
        """Get API key from environment variables or litellm configuration"""
        import os

        import litellm
        from litellm.secret_managers.main import get_secret_str

        return (
            os.environ.get("OPENAI_API_KEY")
            or litellm.api_key
            or litellm.openai_key
            or get_secret_str("OPENAI_API_KEY")
        )

    async def async_make_request(self, input_text: str) -> "OpenAIModerationResponse":
        """
        Make a request to the OpenAI Moderation API.
        """
        request_body = {"model": self.model, "input": input_text}

        verbose_proxy_logger.debug("OpenAI Moderation guard request: %s", request_body)

        response = await self.async_handler.post(
            url=f"{self.api_base}/moderations",
            headers={
                "Authorization": f"Bearer {self.api_key}",
                "Content-Type": "application/json",
            },
            json=request_body,
        )

        verbose_proxy_logger.debug(
            "OpenAI Moderation guard response: %s", response.json()
        )

        if response.status_code != 200:
            raise HTTPException(
                status_code=response.status_code,
                detail={
                    "error": "OpenAI Moderation API request failed",
                    "details": response.text,
                },
            )

        from litellm.types.llms.openai import OpenAIModerationResponse

        return OpenAIModerationResponse(**response.json())
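    # For reference, an illustrative /moderations response body that the checking code
    # below consumes, assuming OpenAIModerationResponse mirrors the OpenAI API schema
    # (example values only, not captured output):
    #
    #   {
    #     "id": "modr-...",
    #     "model": "omni-moderation-latest",
    #     "results": [
    #       {
    #         "flagged": true,
    #         "categories": {"violence": true, "harassment": false, ...},
    #         "category_scores": {"violence": 0.91, "harassment": 0.02, ...}
    #       }
    #     ]
    #   }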

    def _check_moderation_result(
        self, moderation_response: "OpenAIModerationResponse"
    ) -> None:
        """
        Check if the moderation response indicates harmful content and raise exception if needed.
        """
        if not moderation_response.results:
            return

        result = moderation_response.results[0]
        if result.flagged:
            # Build detailed violation information
            violated_categories = []
            if result.categories:
                for category, is_violated in result.categories.items():
                    if is_violated:
                        violated_categories.append(category)

            violation_details = {
                "violated_categories": violated_categories,
                "category_scores": result.category_scores or {},
            }

            verbose_proxy_logger.warning(
                "OpenAI Moderation: Content flagged for violations: %s",
                violation_details,
            )

            raise HTTPException(
                status_code=400,
                detail={
                    "error": "Violated OpenAI moderation policy",
                    "moderation_result": violation_details,
                },
            )

    @log_guardrail_information
    async def apply_guardrail(
        self,
        inputs: GenericGuardrailAPIInputs,
        request_data: dict,
        input_type: Literal["request", "response"],
        logging_obj: Optional["LiteLLMLoggingObj"] = None,
    ) -> GenericGuardrailAPIInputs:
        """
        Apply OpenAI moderation guardrail using the unified guardrail interface.

        This method is called by the UnifiedLLMGuardrails system for all endpoint types
        (chat completions, embeddings, responses API, etc.).

        Args:
            inputs: GenericGuardrailAPIInputs containing texts and/or structured_messages
            request_data: The original request data
            input_type: Whether this is a "request" (pre-call) or "response" (post-call)
            logging_obj: Optional logging object

        Returns:
            The inputs unchanged (moderation doesn't modify content, only blocks)

        Raises:
            HTTPException: If content violates moderation policy
        """
        # Extract text to moderate from inputs
        text_to_moderate: Optional[str] = None

        # Prefer structured_messages if available (has role context)
        if structured_messages := inputs.get("structured_messages"):
            text_to_moderate = self.get_user_prompt(structured_messages)

        # Fall back to texts
        if not text_to_moderate:
            if texts := inputs.get("texts"):
                # Join all texts for moderation
                text_to_moderate = "\n".join(texts)

        if not text_to_moderate:
            verbose_proxy_logger.debug(
                "OpenAI Moderation: No text content to moderate in inputs"
            )
            return inputs

        # Make moderation request
        moderation_response = await self.async_make_request(input_text=text_to_moderate)

        # Check if content is flagged and raise exception if needed
        self._check_moderation_result(moderation_response)

        # Moderation doesn't modify content, just blocks - return inputs unchanged
        return inputs

    @staticmethod
    def get_config_model() -> Optional[Type["GuardrailConfigModel"]]:
        """
        Get the config model for the OpenAI Moderation guardrail.
        """
        from litellm.types.proxy.guardrails.guardrail_hooks.openai.openai_moderation import (
            OpenAIModerationGuardrailConfigModel,
        )

        return OpenAIModerationGuardrailConfigModel
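To make the moderation flow concrete, a minimal end-to-end sketch follows. It assumes OPENAI_API_KEY is set in the environment and that a plain dict is an acceptable value for the inputs argument (apply_guardrail treats GenericGuardrailAPIInputs as dict-like with optional "texts" and "structured_messages" keys); it is a sketch, not an excerpt from this commit:

    import asyncio

    from fastapi import HTTPException

    from litellm.proxy.guardrails.guardrail_hooks.openai.moderations import (
        OpenAIModerationGuardrail,
    )


    async def main():
        guardrail = OpenAIModerationGuardrail(guardrail_name="openai-mod")
        inputs = {"texts": ["I want to hurt someone."]}  # assumed-compatible input shape
        try:
            await guardrail.apply_guardrail(
                inputs=inputs,
                request_data={},
                input_type="request",
            )
            print("content allowed")
        except HTTPException as exc:
            # Flagged content is rejected with a 400 and the violated categories.
            print("blocked:", exc.detail)


    asyncio.run(main())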