chore: initial public snapshot for github upload
This commit is contained in:
@@ -0,0 +1,3 @@
|
||||
from litellm.integrations.azure_sentinel.azure_sentinel import AzureSentinelLogger
|
||||
|
||||
__all__ = ["AzureSentinelLogger"]
|
||||
@@ -0,0 +1,304 @@
|
||||
"""
|
||||
Azure Sentinel Integration - sends logs to Azure Log Analytics using Logs Ingestion API
|
||||
|
||||
Azure Sentinel uses Log Analytics workspaces for data storage. This integration sends
|
||||
LiteLLM logs to the Log Analytics workspace using the Azure Monitor Logs Ingestion API.
|
||||
|
||||
Reference API: https://learn.microsoft.com/en-us/azure/azure-monitor/logs/logs-ingestion-api-overview
|
||||
|
||||
`async_log_success_event` - used by litellm proxy to send logs to Azure Sentinel
|
||||
`async_log_failure_event` - used by litellm proxy to send failure logs to Azure Sentinel
|
||||
|
||||
For batching specific details see CustomBatchLogger class
|
||||
"""
|
||||
|
||||
import asyncio
import os
import time
import traceback
from typing import List, Optional

from litellm._logging import verbose_logger
from litellm.integrations.custom_batch_logger import CustomBatchLogger
from litellm.llms.custom_httpx.http_handler import (
    get_async_httpx_client,
    httpxSpecialProvider,
)
from litellm.types.utils import StandardLoggingPayload
|
||||
|
||||
|
||||
class AzureSentinelLogger(CustomBatchLogger):
    """
    Logger that sends LiteLLM logs to Azure Sentinel via the Azure Monitor
    Logs Ingestion API.

    Azure Sentinel stores data in a Log Analytics workspace; this logger
    batches ``StandardLoggingPayload`` objects and POSTs them to a Data
    Collection Endpoint (DCE) / Data Collection Rule (DCR) stream.

    For batching specifics (batch_size, periodic flush) see CustomBatchLogger.

    Reference API:
    https://learn.microsoft.com/en-us/azure/azure-monitor/logs/logs-ingestion-api-overview
    """

    def __init__(
        self,
        dcr_immutable_id: Optional[str] = None,
        stream_name: Optional[str] = None,
        endpoint: Optional[str] = None,
        tenant_id: Optional[str] = None,
        client_id: Optional[str] = None,
        client_secret: Optional[str] = None,
        **kwargs,
    ):
        """
        Initialize Azure Sentinel logger using the Logs Ingestion API.

        Args:
            dcr_immutable_id (str, optional): Data Collection Rule (DCR) Immutable ID.
                If not provided, will use AZURE_SENTINEL_DCR_IMMUTABLE_ID env var.
            stream_name (str, optional): Stream name from DCR (e.g., "Custom-LiteLLM").
                If not provided, will use AZURE_SENTINEL_STREAM_NAME env var or default to "Custom-LiteLLM".
            endpoint (str, optional): Data Collection Endpoint (DCE) or DCR ingestion endpoint.
                If not provided, will use AZURE_SENTINEL_ENDPOINT env var.
            tenant_id (str, optional): Azure Tenant ID for OAuth2 authentication.
                If not provided, will use AZURE_SENTINEL_TENANT_ID or AZURE_TENANT_ID env var.
            client_id (str, optional): Azure Client ID (Application ID) for OAuth2 authentication.
                If not provided, will use AZURE_SENTINEL_CLIENT_ID or AZURE_CLIENT_ID env var.
            client_secret (str, optional): Azure Client Secret for OAuth2 authentication.
                If not provided, will use AZURE_SENTINEL_CLIENT_SECRET or AZURE_CLIENT_SECRET env var.

        Raises:
            ValueError: if any required setting is missing after env-var fallback.
        """
        self.async_httpx_client = get_async_httpx_client(
            llm_provider=httpxSpecialProvider.LoggingCallback
        )

        # Explicit parameters win; environment variables are the fallback.
        self.dcr_immutable_id = dcr_immutable_id or os.getenv(
            "AZURE_SENTINEL_DCR_IMMUTABLE_ID"
        )
        self.stream_name = stream_name or os.getenv(
            "AZURE_SENTINEL_STREAM_NAME", "Custom-LiteLLM"
        )
        self.endpoint = endpoint or os.getenv("AZURE_SENTINEL_ENDPOINT")
        self.tenant_id = (
            tenant_id
            or os.getenv("AZURE_SENTINEL_TENANT_ID")
            or os.getenv("AZURE_TENANT_ID")
        )
        self.client_id = (
            client_id
            or os.getenv("AZURE_SENTINEL_CLIENT_ID")
            or os.getenv("AZURE_CLIENT_ID")
        )
        self.client_secret = (
            client_secret
            or os.getenv("AZURE_SENTINEL_CLIENT_SECRET")
            or os.getenv("AZURE_CLIENT_SECRET")
        )

        self._validate_config()

        # Build API endpoint:
        # {Endpoint}/dataCollectionRules/{DCR Immutable ID}/streams/{Stream Name}?api-version=2023-01-01
        self.api_endpoint = f"{self.endpoint.rstrip('/')}/dataCollectionRules/{self.dcr_immutable_id}/streams/{self.stream_name}?api-version=2023-01-01"

        # OAuth2 scope for Azure Monitor; the bearer token is cached on the
        # instance and refreshed shortly before expiry (see _get_oauth_token).
        self.oauth_scope = "https://monitor.azure.com/.default"
        self.oauth_token: Optional[str] = None
        self.oauth_token_expires_at: Optional[float] = None

        self.flush_lock = asyncio.Lock()
        super().__init__(**kwargs, flush_lock=self.flush_lock)
        # Initialize the queue BEFORE scheduling the background flush task so
        # periodic_flush can never observe an uninitialized attribute.
        self.log_queue: List[StandardLoggingPayload] = []
        asyncio.create_task(self.periodic_flush())

    def _validate_config(self) -> None:
        """Raise ValueError for any required setting still missing after env fallback."""
        if not self.dcr_immutable_id:
            raise ValueError(
                "AZURE_SENTINEL_DCR_IMMUTABLE_ID is required. Set it as an environment variable or pass dcr_immutable_id parameter."
            )
        if not self.endpoint:
            raise ValueError(
                "AZURE_SENTINEL_ENDPOINT is required. Set it as an environment variable or pass endpoint parameter."
            )
        if not self.tenant_id:
            raise ValueError(
                "AZURE_SENTINEL_TENANT_ID or AZURE_TENANT_ID is required. Set it as an environment variable or pass tenant_id parameter."
            )
        if not self.client_id:
            raise ValueError(
                "AZURE_SENTINEL_CLIENT_ID or AZURE_CLIENT_ID is required. Set it as an environment variable or pass client_id parameter."
            )
        if not self.client_secret:
            raise ValueError(
                "AZURE_SENTINEL_CLIENT_SECRET or AZURE_CLIENT_SECRET is required. Set it as an environment variable or pass client_secret parameter."
            )

    async def _get_oauth_token(self) -> str:
        """
        Get an OAuth2 Bearer token for the Azure Monitor Logs Ingestion API.

        Uses the client-credentials flow against login.microsoftonline.com.
        The token is cached on the instance and reused until 60 seconds
        before its reported expiry.

        Returns:
            Bearer token string.

        Raises:
            Exception: if the token endpoint returns a non-200 response or
                the response body lacks an access_token.
        """
        # Reuse the cached token while it is still valid (60s safety margin).
        if (
            self.oauth_token
            and self.oauth_token_expires_at
            and time.time() < self.oauth_token_expires_at - 60
        ):
            return self.oauth_token

        # Get a new token using the client-credentials flow.
        assert self.tenant_id is not None, "tenant_id is required"
        assert self.client_id is not None, "client_id is required"
        assert self.client_secret is not None, "client_secret is required"

        token_url = (
            f"https://login.microsoftonline.com/{self.tenant_id}/oauth2/v2.0/token"
        )
        token_data = {
            "client_id": self.client_id,
            "client_secret": self.client_secret,
            "scope": self.oauth_scope,
            "grant_type": "client_credentials",
        }

        response = await self.async_httpx_client.post(
            url=token_url,
            data=token_data,
            headers={"Content-Type": "application/x-www-form-urlencoded"},
        )

        if response.status_code != 200:
            raise Exception(
                f"Failed to get OAuth2 token: {response.status_code} - {response.text}"
            )

        token_response = response.json()
        self.oauth_token = token_response.get("access_token")
        expires_in = token_response.get("expires_in", 3600)

        if not self.oauth_token:
            raise Exception("OAuth2 token response did not contain access_token")

        # Cache the expiry time for the refresh check above.
        self.oauth_token_expires_at = time.time() + expires_in

        return self.oauth_token

    def _enqueue_payload(self, kwargs) -> bool:
        """
        Extract the StandardLoggingPayload from ``kwargs`` and append it to
        the batch queue. Shared by the success and failure handlers.

        Returns:
            True if a payload was queued, False if none was found.
        """
        standard_logging_payload = kwargs.get("standard_logging_object", None)

        if standard_logging_payload is None:
            verbose_logger.warning(
                "Azure Sentinel: standard_logging_object not found in kwargs"
            )
            return False

        self.log_queue.append(standard_logging_payload)
        return True

    async def async_log_success_event(self, kwargs, response_obj, start_time, end_time):
        """
        Async log success events to Azure Sentinel.

        - Gets StandardLoggingPayload from kwargs
        - Adds it to the batch queue
        - Flushes based on CustomBatchLogger settings

        Raises:
            Nothing — errors are reported via a NON-blocking
            verbose_logger.exception so the request path is never broken.
        """
        try:
            verbose_logger.debug(
                "Azure Sentinel: Logging - Enters logging function for model %s", kwargs
            )
            if not self._enqueue_payload(kwargs):
                return

            if len(self.log_queue) >= self.batch_size:
                await self.async_send_batch()

        except Exception as e:
            verbose_logger.exception(
                f"Azure Sentinel Layer Error - {str(e)}\n{traceback.format_exc()}"
            )

    async def async_log_failure_event(self, kwargs, response_obj, start_time, end_time):
        """
        Async log failure events to Azure Sentinel.

        - Gets StandardLoggingPayload from kwargs
        - Adds it to the batch queue
        - Flushes based on CustomBatchLogger settings

        Raises:
            Nothing — errors are reported via a NON-blocking
            verbose_logger.exception so the request path is never broken.
        """
        try:
            verbose_logger.debug(
                "Azure Sentinel: Logging - Enters failure logging function for model %s",
                kwargs,
            )
            if not self._enqueue_payload(kwargs):
                return

            if len(self.log_queue) >= self.batch_size:
                await self.async_send_batch()

        except Exception as e:
            verbose_logger.exception(
                f"Azure Sentinel Layer Error - {str(e)}\n{traceback.format_exc()}"
            )

    async def async_send_batch(self):
        """
        Send the queued batch of logs to the Azure Monitor Logs Ingestion API.

        The queue is cleared afterwards whether or not delivery succeeded,
        so a persistent API failure cannot grow the queue without bound.

        Raises:
            Nothing — errors are reported via a NON-blocking
            verbose_logger.exception.
        """
        try:
            if not self.log_queue:
                return

            verbose_logger.debug(
                "Azure Sentinel - about to flush %s events", len(self.log_queue)
            )

            from litellm.litellm_core_utils.safe_json_dumps import safe_dumps

            # Get OAuth2 token (cached between batches).
            bearer_token = await self._get_oauth_token()

            # The Logs Ingestion API expects a JSON array of log objects.
            body = safe_dumps(self.log_queue)

            headers = {
                "Authorization": f"Bearer {bearer_token}",
                "Content-Type": "application/json",
            }

            response = await self.async_httpx_client.post(
                url=self.api_endpoint, data=body.encode("utf-8"), headers=headers
            )

            # 204 is the documented success status; accept 200 as well.
            if response.status_code not in [200, 204]:
                verbose_logger.error(
                    "Azure Sentinel API error: status_code=%s, response=%s",
                    response.status_code,
                    response.text,
                )
                raise Exception(
                    f"Failed to send logs to Azure Sentinel: {response.status_code} - {response.text}"
                )

            verbose_logger.debug(
                "Azure Sentinel: Response from API status_code: %s",
                response.status_code,
            )

        except Exception as e:
            verbose_logger.exception(
                f"Azure Sentinel Error sending batch API - {str(e)}\n{traceback.format_exc()}"
            )
        finally:
            # Drop the batch regardless of outcome (best-effort delivery).
            self.log_queue.clear()
|
||||
@@ -0,0 +1,179 @@
|
||||
{
|
||||
"id": "chatcmpl-2299b6a2-82a3-465a-b47c-04e685a2227f",
|
||||
"trace_id": "97311c60-9a61-4f48-a814-70139ee57868",
|
||||
"call_type": "acompletion",
|
||||
"cache_hit": null,
|
||||
"stream": true,
|
||||
"status": "success",
|
||||
"custom_llm_provider": "openai",
|
||||
"saved_cache_cost": 0.0,
|
||||
"startTime": 1766000068.28466,
|
||||
"endTime": 1766000070.07935,
|
||||
"completionStartTime": 1766000070.07935,
|
||||
"response_time": 1.79468512535095,
|
||||
"model": "gpt-4o",
|
||||
"metadata": {
|
||||
"user_api_key_hash": null,
|
||||
"user_api_key_alias": null,
|
||||
"user_api_key_team_id": null,
|
||||
"user_api_key_org_id": null,
|
||||
"user_api_key_user_id": null,
|
||||
"user_api_key_team_alias": null,
|
||||
"user_api_key_user_email": null,
|
||||
"spend_logs_metadata": null,
|
||||
"requester_ip_address": null,
|
||||
"requester_metadata": null,
|
||||
"user_api_key_end_user_id": null,
|
||||
"prompt_management_metadata": null,
|
||||
"applied_guardrails": [],
|
||||
"mcp_tool_call_metadata": null,
|
||||
"vector_store_request_metadata": null,
|
||||
"guardrail_information": null
|
||||
},
|
||||
"cache_key": null,
|
||||
"response_cost": 0.00022500000000000002,
|
||||
"total_tokens": 30,
|
||||
"prompt_tokens": 10,
|
||||
"completion_tokens": 20,
|
||||
"request_tags": [],
|
||||
"end_user": "",
|
||||
"api_base": "",
|
||||
"model_group": "",
|
||||
"model_id": "",
|
||||
"requester_ip_address": null,
|
||||
"messages": [
|
||||
{
|
||||
"role": "user",
|
||||
"content": "Hello, world!"
|
||||
}
|
||||
],
|
||||
"response": {
|
||||
"id": "chatcmpl-2299b6a2-82a3-465a-b47c-04e685a2227f",
|
||||
"created": 1742855151,
|
||||
"model": "gpt-4o",
|
||||
"object": "chat.completion",
|
||||
"system_fingerprint": null,
|
||||
"choices": [
|
||||
{
|
||||
"finish_reason": "stop",
|
||||
"index": 0,
|
||||
"message": {
|
||||
"content": "hi",
|
||||
"role": "assistant",
|
||||
"tool_calls": null,
|
||||
"function_call": null,
|
||||
"provider_specific_fields": null
|
||||
}
|
||||
}
|
||||
],
|
||||
"usage": {
|
||||
"completion_tokens": 20,
|
||||
"prompt_tokens": 10,
|
||||
"total_tokens": 30,
|
||||
"completion_tokens_details": null,
|
||||
"prompt_tokens_details": null
|
||||
}
|
||||
},
|
||||
"model_parameters": {},
|
||||
"hidden_params": {
|
||||
"model_id": null,
|
||||
"cache_key": null,
|
||||
"api_base": "https://api.openai.com",
|
||||
"response_cost": 0.00022500000000000002,
|
||||
"additional_headers": {},
|
||||
"litellm_overhead_time_ms": null,
|
||||
"batch_models": null,
|
||||
"litellm_model_name": "gpt-4o"
|
||||
},
|
||||
"model_map_information": {
|
||||
"model_map_key": "gpt-4o",
|
||||
"model_map_value": {
|
||||
"key": "gpt-4o",
|
||||
"max_tokens": 16384,
|
||||
"max_input_tokens": 128000,
|
||||
"max_output_tokens": 16384,
|
||||
"input_cost_per_token": 2.5e-06,
|
||||
"cache_creation_input_token_cost": null,
|
||||
"cache_read_input_token_cost": 1.25e-06,
|
||||
"input_cost_per_character": null,
|
||||
"input_cost_per_token_above_128k_tokens": null,
|
||||
"input_cost_per_query": null,
|
||||
"input_cost_per_second": null,
|
||||
"input_cost_per_audio_token": null,
|
||||
"input_cost_per_token_batches": 1.25e-06,
|
||||
"output_cost_per_token_batches": 5e-06,
|
||||
"output_cost_per_token": 1e-05,
|
||||
"output_cost_per_audio_token": null,
|
||||
"output_cost_per_character": null,
|
||||
"output_cost_per_token_above_128k_tokens": null,
|
||||
"output_cost_per_character_above_128k_tokens": null,
|
||||
"output_cost_per_second": null,
|
||||
"output_cost_per_image": null,
|
||||
"output_vector_size": null,
|
||||
"litellm_provider": "openai",
|
||||
"mode": "chat",
|
||||
"supports_system_messages": true,
|
||||
"supports_response_schema": true,
|
||||
"supports_vision": true,
|
||||
"supports_function_calling": true,
|
||||
"supports_tool_choice": true,
|
||||
"supports_assistant_prefill": false,
|
||||
"supports_prompt_caching": true,
|
||||
"supports_audio_input": false,
|
||||
"supports_audio_output": false,
|
||||
"supports_pdf_input": false,
|
||||
"supports_embedding_image_input": false,
|
||||
"supports_native_streaming": null,
|
||||
"supports_web_search": true,
|
||||
"search_context_cost_per_query": {
|
||||
"search_context_size_low": 0.03,
|
||||
"search_context_size_medium": 0.035,
|
||||
"search_context_size_high": 0.05
|
||||
},
|
||||
"tpm": null,
|
||||
"rpm": null,
|
||||
"supported_openai_params": [
|
||||
"frequency_penalty",
|
||||
"logit_bias",
|
||||
"logprobs",
|
||||
"top_logprobs",
|
||||
"max_tokens",
|
||||
"max_completion_tokens",
|
||||
"modalities",
|
||||
"prediction",
|
||||
"n",
|
||||
"presence_penalty",
|
||||
"seed",
|
||||
"stop",
|
||||
"stream",
|
||||
"stream_options",
|
||||
"temperature",
|
||||
"top_p",
|
||||
"tools",
|
||||
"tool_choice",
|
||||
"function_call",
|
||||
"functions",
|
||||
"max_retries",
|
||||
"extra_headers",
|
||||
"parallel_tool_calls",
|
||||
"audio",
|
||||
"response_format",
|
||||
"user"
|
||||
]
|
||||
}
|
||||
},
|
||||
"error_str": null,
|
||||
"error_information": {
|
||||
"error_code": "",
|
||||
"error_class": "",
|
||||
"llm_provider": "",
|
||||
"traceback": "",
|
||||
"error_message": ""
|
||||
},
|
||||
"response_cost_failure_debug_info": null,
|
||||
"guardrail_information": null,
|
||||
"standard_built_in_tools_params": {
|
||||
"web_search_options": null,
|
||||
"file_search": null
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user