chore: initial public snapshot for github upload
This commit is contained in:
@@ -0,0 +1,39 @@
|
||||
from typing import TYPE_CHECKING
|
||||
|
||||
from litellm.types.guardrails import SupportedGuardrailIntegrations
|
||||
|
||||
from .pangea import PangeaHandler
|
||||
|
||||
if TYPE_CHECKING:
|
||||
from litellm.types.guardrails import Guardrail, LitellmParams
|
||||
|
||||
|
||||
def initialize_guardrail(litellm_params: "LitellmParams", guardrail: "Guardrail"):
    """Build a PangeaHandler from guardrail config and register it with litellm.

    Args:
        litellm_params: Parsed litellm params for this guardrail (recipes,
            api key/base, mode, default_on).
        guardrail: Guardrail definition dict; must carry a "guardrail_name".

    Returns:
        The PangeaHandler instance that was registered as a litellm callback.

    Raises:
        ValueError: If the guardrail definition has no name.
    """
    import litellm

    name = guardrail.get("guardrail_name")
    if not name:
        raise ValueError("Pangea guardrail name is required")

    handler = PangeaHandler(
        guardrail_name=name,
        pangea_input_recipe=litellm_params.pangea_input_recipe,
        pangea_output_recipe=litellm_params.pangea_output_recipe,
        api_base=litellm_params.api_base,
        api_key=litellm_params.api_key,
        event_hook=litellm_params.mode,
        default_on=litellm_params.default_on,
    )
    litellm.logging_callback_manager.add_litellm_callback(handler)

    return handler
|
||||
|
||||
|
||||
# Registry consumed by the proxy's guardrail loader: maps the Pangea
# integration name to the factory that builds + registers a handler.
guardrail_initializer_registry = {
    SupportedGuardrailIntegrations.PANGEA.value: initialize_guardrail,
}


# Maps the Pangea integration name directly to its handler class, for code
# paths that need the class rather than a constructed instance.
guardrail_class_registry = {
    SupportedGuardrailIntegrations.PANGEA.value: PangeaHandler,
}
|
||||
@@ -0,0 +1,343 @@
|
||||
# litellm/proxy/guardrails/guardrail_hooks/pangea.py
|
||||
import os
|
||||
from typing import TYPE_CHECKING, Any, Dict, List, Optional, Type, cast
|
||||
|
||||
from fastapi import HTTPException
|
||||
|
||||
from litellm._logging import verbose_proxy_logger
|
||||
from litellm.caching.dual_cache import DualCache
|
||||
from litellm.integrations.custom_guardrail import (
|
||||
CustomGuardrail,
|
||||
log_guardrail_information,
|
||||
)
|
||||
from litellm.llms.custom_httpx.http_handler import (
|
||||
get_async_httpx_client,
|
||||
httpxSpecialProvider,
|
||||
)
|
||||
from litellm.proxy._types import UserAPIKeyAuth
|
||||
from litellm.proxy.common_utils.callback_utils import (
|
||||
add_guardrail_to_applied_guardrails_header,
|
||||
)
|
||||
from litellm.types.guardrails import GuardrailEventHooks
|
||||
from litellm.types.utils import (
|
||||
Choices,
|
||||
LLMResponseTypes,
|
||||
ModelResponse,
|
||||
TextCompletionResponse,
|
||||
)
|
||||
|
||||
if TYPE_CHECKING:
|
||||
from litellm.types.proxy.guardrails.guardrail_hooks.base import GuardrailConfigModel
|
||||
|
||||
|
||||
class PangeaGuardrailMissingSecrets(Exception):
    """Raised when the Pangea API key is absent from both config and environment."""
|
||||
|
||||
|
||||
class _TextCompletionRequest:
|
||||
def __init__(self, body):
|
||||
self.body = body
|
||||
|
||||
def get_messages(self) -> list[dict]:
|
||||
return [{"role": "user", "content": self.body["prompt"]}]
|
||||
|
||||
# This mutates the original dict, but we'll still return it anyways
|
||||
def update_original_body(self, prompt_messages: list[dict]) -> Any:
|
||||
assert len(prompt_messages) == 1
|
||||
self.body["prompt"] = prompt_messages[0]["content"]
|
||||
return self.body
|
||||
|
||||
|
||||
class PangeaHandler(CustomGuardrail):
    """
    Pangea AI Guardrail handler to interact with the Pangea AI Guard service.

    This class implements the necessary hooks to call the Pangea AI Guard API
    for input and output scanning based on the configured recipe.
    """

    def __init__(
        self,
        guardrail_name: str,
        pangea_input_recipe: Optional[str] = None,
        pangea_output_recipe: Optional[str] = None,
        api_key: Optional[str] = None,
        api_base: Optional[str] = None,
        **kwargs,
    ):
        """
        Initializes the PangeaHandler.

        Args:
            guardrail_name (str): The name of the guardrail instance.
            pangea_input_recipe (Optional[str]): Pangea recipe key used when scanning input.
            pangea_output_recipe (Optional[str]): Pangea recipe key used when scanning output.
            api_key (Optional[str]): The Pangea API key. Reads from PANGEA_API_KEY env var if None.
            api_base (Optional[str]): The Pangea API base URL. Reads from PANGEA_API_BASE env var or uses default if None.
            **kwargs: Additional arguments passed to the CustomGuardrail base class.

        Raises:
            PangeaGuardrailMissingSecrets: If no API key is supplied or found in the environment.
        """
        self.async_handler = get_async_httpx_client(
            llm_provider=httpxSpecialProvider.GuardrailCallback
        )
        self.api_key = api_key or os.environ.get("PANGEA_API_KEY")
        if not self.api_key:
            raise PangeaGuardrailMissingSecrets(
                "Pangea API Key not found. Set PANGEA_API_KEY environment variable or pass it in litellm_params."
            )

        # Default Pangea base URL if not provided
        self.api_base = (
            api_base
            or os.environ.get("PANGEA_API_BASE")
            or "https://ai-guard.aws.us.pangea.cloud"
        )
        self.pangea_input_recipe = pangea_input_recipe
        self.pangea_output_recipe = pangea_output_recipe

        supported_event_hooks = [
            GuardrailEventHooks.pre_call,
            GuardrailEventHooks.post_call,
        ]

        # Pass relevant kwargs to the parent class
        super().__init__(
            guardrail_name=guardrail_name,
            supported_event_hooks=supported_event_hooks,
            **kwargs,
        )
        verbose_proxy_logger.debug(
            f"Initialized Pangea Guardrail: name={guardrail_name}, recipe={pangea_input_recipe}, api_base={self.api_base}"
        )

    async def _call_pangea_ai_guard(
        self, api: str, payload: dict, hook_name: str
    ) -> dict:
        """
        Makes the API call to the Pangea AI Guard endpoint.
        The function itself will raise an error in the case that a response
        should be blocked, but will return the response body containing any
        redacted messages that the caller should act on.

        Args:
            api (str): Which API to use (text/guard or v1beta/guard)
            payload (dict): The request payload.
            hook_name (str): Name of the hook calling this function (for logging).

        Raises:
            HTTPException: If the Pangea API returns a 'blocked: true' response.
            Exception: For other API call failures.

        Returns:
            dict: The parsed Pangea response body.
        """
        endpoint = f"{self.api_base}/{api}"

        headers = {
            "Authorization": f"Bearer {self.api_key}",
            "Content-Type": "application/json",
        }

        verbose_proxy_logger.debug(
            f"Pangea Guardrail ({hook_name}): Calling endpoint {endpoint} with payload: {payload}"
        )

        response = await self.async_handler.post(
            url=endpoint, json=payload, headers=headers
        )
        response.raise_for_status()

        result = response.json()

        # Pangea signals a policy violation via result.blocked; surface it as
        # a 400 so the proxy rejects the request/response.
        if result.get("result", {}).get("blocked"):
            verbose_proxy_logger.warning(
                f"Pangea Guardrail ({hook_name}): Request blocked. Response: {result}"
            )
            raise HTTPException(
                status_code=400,  # Bad Request, indicating violation
                detail={
                    "error": "Violated Pangea guardrail policy",
                    "guardrail_name": self.guardrail_name,
                },
            )
        verbose_proxy_logger.debug(
            f"Pangea Guardrail ({hook_name}): Request passed. Response: {result.get('result', {}).get('detectors')}"
        )

        return result

    async def _async_pre_call_hook(
        self,
        user_api_key_dict: UserAPIKeyAuth,
        cache: DualCache,
        data: dict,
        call_type: str,
    ):
        """Scan request input with Pangea; apply any redactions back onto `data`.

        Returns the (possibly mutated) request data when Pangea transformed the
        input, otherwise None (no change needed).
        """
        transformer = None
        messages: Any = None
        # Text completions carry a single `prompt`; adapt it to chat messages.
        if call_type == "text_completion" or call_type == "atext_completion":
            transformer = _TextCompletionRequest(data)
            messages = transformer.get_messages()
        else:
            messages = data.get("messages")

        ai_guard_payload = {
            "debug": False,
            "input": {"messages": messages, "tools": data.get("tools")},  # type: ignore
            "event_type": "input",
        }
        if self.pangea_input_recipe:
            ai_guard_payload["recipe"] = self.pangea_input_recipe

        ai_guard_response = await self._call_pangea_ai_guard(
            "v1beta/guard", ai_guard_payload, "async_pre_call_hook"
        )
        add_guardrail_to_applied_guardrails_header(
            request_data=data, guardrail_name=self.guardrail_name
        )

        # No redactions -> nothing to write back.
        if not ai_guard_response.get("result", {}).get("transformed"):
            return

        output = ai_guard_response.get("result", {}).get("output", {})
        if call_type == "text_completion" or call_type == "atext_completion":
            data = transformer.update_original_body(output["messages"])  # type: ignore
        else:
            data["messages"] = output["messages"]
        return data

    @log_guardrail_information
    async def async_pre_call_hook(
        self,
        user_api_key_dict: UserAPIKeyAuth,
        cache: DualCache,
        data: dict,
        call_type: str,
    ):
        """Guardrail hook run before the LLM call (scans input)."""
        event_type = GuardrailEventHooks.pre_call
        if self.should_run_guardrail(data=data, event_type=event_type) is not True:
            verbose_proxy_logger.debug(
                f"Pangea Guardrail (async_pre_call_hook): Guardrail is disabled {self.guardrail_name}."
            )
            return data

        try:
            return await self._async_pre_call_hook(
                user_api_key_dict, cache, data, call_type
            )
        except HTTPException:
            # Policy violations (400) propagate as-is.
            raise
        except Exception as e:
            # Wrap unexpected failures so the proxy returns a structured 500.
            raise HTTPException(
                status_code=500,
                detail={
                    "error": "Error in Pangea Guardrail",
                    "guardrail_name": self.guardrail_name,
                    "exceptions": str(e),
                },
            ) from e

    async def _async_post_call_success_hook(
        self,
        data: dict,
        user_api_key_dict: UserAPIKeyAuth,
        # This union isn't actually correct -- it can get other response types depending on the API called
        response: LLMResponseTypes,
    ):
        """Scan LLM output with Pangea; apply any redactions to `response.choices`.

        Returns the mutated response when Pangea transformed the output,
        otherwise None (no change needed).
        """
        if isinstance(response, TextCompletionResponse):
            # Assume the earlier call type as well
            input_messages = _TextCompletionRequest(data).get_messages()
        elif isinstance(response, ModelResponse):
            messages = data.get("messages")
            if messages is None:
                return  # No messages to check
            input_messages = cast(List[Dict[Any, Any]], messages)
        else:
            return

        if choices := response.get("choices"):
            if isinstance(choices, list):
                # Pydantic Choices objects must be serialized to plain dicts
                # before being sent in the JSON payload.
                serialized_choices = []
                for c in choices:
                    if isinstance(c, Choices):
                        try:
                            serialized_choices.append(c.model_dump())
                        except Exception:
                            serialized_choices.append(c.dict())
                    else:
                        serialized_choices.append(c)
                choices = serialized_choices

        ai_guard_payload = {
            "debug": False,
            "input": {
                "messages": input_messages,
                "tools": data.get("tools"),
                "choices": choices,
            },
            "event_type": "output",
        }

        if self.pangea_output_recipe:
            ai_guard_payload["recipe"] = self.pangea_output_recipe

        # BUGFIX: hook name was previously mislabeled "async_pre_call_hook",
        # which made log lines from the output scan look like input scans.
        ai_guard_response = await self._call_pangea_ai_guard(
            "v1beta/guard", ai_guard_payload, "async_post_call_success_hook"
        )
        add_guardrail_to_applied_guardrails_header(
            request_data=data, guardrail_name=self.guardrail_name
        )

        if not ai_guard_response.get("result", {}).get("transformed"):
            return

        output = ai_guard_response.get("result", {}).get("output", {})
        response.choices = output["choices"]
        return response

    @log_guardrail_information
    async def async_post_call_success_hook(
        self,
        data: dict,
        user_api_key_dict: UserAPIKeyAuth,
        # This union isn't actually correct -- it can get other response types depending on the API called
        response: LLMResponseTypes,
    ):
        """
        Guardrail hook run after a successful LLM call (scans output).

        Args:
            data (dict): The original request data.
            user_api_key_dict (UserAPIKeyAuth): User API key details.
            response (LLMResponseTypes): The response object from the LLM call.
        """
        event_type = GuardrailEventHooks.post_call
        if self.should_run_guardrail(data=data, event_type=event_type) is not True:
            # BUGFIX: message previously said "async_pre_call_hook".
            verbose_proxy_logger.debug(
                f"Pangea Guardrail (async_post_call_success_hook): Guardrail is disabled {self.guardrail_name}."
            )
            return data
        try:
            return await self._async_post_call_success_hook(
                data, user_api_key_dict, response
            )
        except HTTPException:
            # Policy violations (400) propagate as-is.
            raise
        except Exception as e:
            # Wrap unexpected failures so the proxy returns a structured 500.
            raise HTTPException(
                status_code=500,
                detail={
                    "error": "Error in Pangea Guardrail",
                    "guardrail_name": self.guardrail_name,
                    "exceptions": str(e),
                },
            ) from e

    @staticmethod
    def get_config_model() -> Optional[Type["GuardrailConfigModel"]]:
        """Return the pydantic config model used to validate Pangea guardrail config."""
        from litellm.types.proxy.guardrails.guardrail_hooks.pangea import (
            PangeaGuardrailConfigModel,
        )

        return PangeaGuardrailConfigModel
|
||||
Reference in New Issue
Block a user