litellm/tests/test_litellm/proxy/test_proxy_server.py

import asyncio
import importlib
import json
import os
import socket
import subprocess
import sys
from datetime import datetime, timezone
from pathlib import Path
from unittest import mock
from unittest.mock import AsyncMock, MagicMock, mock_open, patch

import click
import httpx
import pytest
import yaml
from fastapi import FastAPI
from fastapi.staticfiles import StaticFiles
from fastapi.testclient import TestClient

sys.path.insert(
    0, os.path.abspath("../../..")
)  # Adds the parent directory to the system-path

import litellm
from litellm.proxy.auth.user_api_key_auth import user_api_key_auth
from litellm.proxy.proxy_server import app, initialize

example_embedding_result = {
    "object": "list",
    "data": [
        {
            "object": "embedding",
            "index": 0,
            "embedding": [
                -0.006929283495992422,
                -0.005336422007530928,
                -4.547132266452536e-05,
                -0.024047505110502243,
                -0.006929283495992422,
                -0.005336422007530928,
                -4.547132266452536e-05,
                -0.024047505110502243,
                -0.006929283495992422,
                -0.005336422007530928,
                -4.547132266452536e-05,
                -0.024047505110502243,
            ],
        }
    ],
    "model": "text-embedding-3-small",
    "usage": {"prompt_tokens": 5, "total_tokens": 5},
}


def mock_patch_aembedding():
    return mock.patch(
        "litellm.proxy.proxy_server.llm_router.aembedding",
        return_value=example_embedding_result,
    )


@pytest.fixture(scope="function")
def client_no_auth():
    # Assuming litellm.proxy.proxy_server is an object
    from litellm.proxy.proxy_server import cleanup_router_config_variables

    cleanup_router_config_variables()
    filepath = os.path.dirname(os.path.abspath(__file__))
    config_fp = f"{filepath}/test_configs/test_config_no_auth.yaml"
    # initialize can get run in parallel, it sets specific variables for the fast api app, sinc eit gets run in parallel different tests use the wrong variables
    asyncio.run(initialize(config=config_fp, debug=True))
    return TestClient(app)


def test_login_v2_returns_redirect_url_and_sets_cookie(monkeypatch):
    mock_login_result = {"user_id": "test-user"}
    mock_prisma_client = MagicMock()
    mock_authenticate_user = AsyncMock(return_value=mock_login_result)
    mock_create_ui_token_object = MagicMock(return_value={"user_id": "test-user"})
    mock_jwt_encode = MagicMock(return_value="signed-token")

    monkeypatch.setattr(
        "litellm.proxy.auth.login_utils.authenticate_user",
        mock_authenticate_user,
    )
    monkeypatch.setattr(
        "litellm.proxy.auth.login_utils.create_ui_token_object",
        mock_create_ui_token_object,
    )
    monkeypatch.setattr("jwt.encode", mock_jwt_encode)
    monkeypatch.setattr("litellm.proxy.proxy_server.master_key", "test-master-key")
    monkeypatch.setattr("litellm.proxy.proxy_server.general_settings", {})
    monkeypatch.setattr("litellm.proxy.proxy_server.premium_user", False)
    monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client)
    monkeypatch.setattr("litellm.proxy.utils.get_server_root_path", lambda: "")

    client = TestClient(app)
    response = client.post(
        "/v2/login",
        json={"username": "alice", "password": "secret"},
    )

    assert response.status_code == 200
    assert (
        response.json()
        == {"redirect_url": "http://testserver/ui/?login=success"}
    )
    assert response.cookies.get("token") == "signed-token"

    mock_authenticate_user.assert_awaited_once_with(
        username="alice",
        password="secret",
        master_key="test-master-key",
        prisma_client=mock_prisma_client,
    )
    mock_create_ui_token_object.assert_called_once_with(
        login_result=mock_login_result,
        general_settings={},
        premium_user=False,
    )
    mock_jwt_encode.assert_called_once_with(
        {"user_id": "test-user"},
        "test-master-key",
        algorithm="HS256",
    )


def test_login_v2_returns_json_on_proxy_exception(monkeypatch):
    """Test that /v2/login returns JSON error when ProxyException is raised"""
    from litellm.proxy._types import ProxyErrorTypes, ProxyException

    mock_prisma_client = MagicMock()
    mock_authenticate_user = AsyncMock(
        side_effect=ProxyException(
            message="Invalid credentials",
            type=ProxyErrorTypes.auth_error,
            param="password",
            code=401,
        )
    )

    monkeypatch.setattr(
        "litellm.proxy.auth.login_utils.authenticate_user",
        mock_authenticate_user,
    )
    monkeypatch.setattr("litellm.proxy.proxy_server.master_key", "test-master-key")
    monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client)

    client = TestClient(app)
    response = client.post(
        "/v2/login",
        json={"username": "alice", "password": "wrong"},
    )

    assert response.status_code == 401
    assert response.headers["content-type"] == "application/json"
    data = response.json()
    assert "error" in data
    assert data["error"]["message"] == "Invalid credentials"
    assert data["error"]["type"] == "auth_error"


def test_login_v2_returns_json_on_http_exception(monkeypatch):
    """Test that /v2/login converts HTTPException to JSON error response"""
    from fastapi import HTTPException

    mock_prisma_client = MagicMock()
    mock_authenticate_user = AsyncMock(
        side_effect=HTTPException(status_code=401, detail="Unauthorized")
    )

    monkeypatch.setattr(
        "litellm.proxy.auth.login_utils.authenticate_user",
        mock_authenticate_user,
    )
    monkeypatch.setattr("litellm.proxy.proxy_server.master_key", "test-master-key")
    monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client)

    client = TestClient(app)
    response = client.post(
        "/v2/login",
        json={"username": "alice", "password": "secret"},
    )

    assert response.status_code == 401
    assert response.headers["content-type"] == "application/json"
    data = response.json()
    assert "error" in data
    assert isinstance(data["error"], dict)


def test_login_v2_returns_json_on_unexpected_exception(monkeypatch):
    """Test that /v2/login returns JSON error when unexpected exception occurs"""
    mock_prisma_client = MagicMock()
    mock_authenticate_user = AsyncMock(side_effect=ValueError("Unexpected error"))

    monkeypatch.setattr(
        "litellm.proxy.auth.login_utils.authenticate_user",
        mock_authenticate_user,
    )
    monkeypatch.setattr("litellm.proxy.proxy_server.master_key", "test-master-key")
    monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client)

    client = TestClient(app)
    response = client.post(
        "/v2/login",
        json={"username": "alice", "password": "secret"},
    )

    assert response.status_code == 500
    assert response.headers["content-type"] == "application/json"
    data = response.json()
    assert "error" in data
    assert isinstance(data["error"], dict)
    assert "Unexpected error" in data["error"]["message"]


def test_login_v2_returns_json_on_invalid_json_body(monkeypatch):
    """Test that /v2/login returns JSON error when request body is invalid JSON"""
    monkeypatch.setattr("litellm.proxy.proxy_server.master_key", "test-master-key")

    client = TestClient(app)
    response = client.post(
        "/v2/login",
        content="invalid json",
        headers={"Content-Type": "application/json"},
    )

    assert response.status_code == 500
    assert response.headers["content-type"] == "application/json"
    data = response.json()
    assert "error" in data
    assert isinstance(data["error"], dict)


def test_fallback_login_has_no_deprecation_banner(client_no_auth):
    response = client_no_auth.get("/fallback/login")

    assert response.status_code == 200
    html = response.text
    assert '<div class="deprecation-banner">' not in html
    assert "Deprecated:" not in html
    assert "<form" in html


def test_sso_key_generate_shows_deprecation_banner(client_no_auth, monkeypatch):
    # Ensure the route returns the HTML form instead of redirecting
    monkeypatch.setattr(
        "litellm.proxy.management_endpoints.ui_sso.show_missing_vars_in_env",
        lambda: None,
    )
    monkeypatch.setattr(
        "litellm.proxy.management_endpoints.ui_sso.SSOAuthenticationHandler.get_redirect_url_for_sso",
        lambda *args, **kwargs: "http://test/redirect",
    )
    monkeypatch.setattr(
        "litellm.proxy.management_endpoints.ui_sso.SSOAuthenticationHandler._get_cli_state",
        lambda *args, **kwargs: None,
    )
    monkeypatch.setattr(
        "litellm.proxy.management_endpoints.ui_sso.SSOAuthenticationHandler.should_use_sso_handler",
        lambda *args, **kwargs: False,
    )
    monkeypatch.setenv("UI_USERNAME", "admin")

    response = client_no_auth.get("/sso/key/generate")

    assert response.status_code == 200
    html = response.text
    assert '<div class="deprecation-banner">' in html
    assert "Deprecated:" in html


def test_restructure_ui_html_files_handles_nested_routes(tmp_path):
    """
    Test that _restructure_ui_html_files correctly restructures HTML files.
    Note: This function is always called now, both in development and non-root Docker environments.
    """
    from litellm.proxy import proxy_server

    ui_root = tmp_path / "ui"
    ui_root.mkdir()

    def write_file(path: Path, content: str) -> None:
        path.parent.mkdir(parents=True, exist_ok=True)
        path.write_text(content)

    write_file(ui_root / "home.html", "home")
    write_file(ui_root / "mcp" / "oauth" / "callback.html", "callback")
    write_file(ui_root / "existing" / "index.html", "keep")
    write_file(ui_root / "_next" / "ignore.html", "asset")
    write_file(ui_root / "litellm-asset-prefix" / "ignore.html", "asset")

    proxy_server._restructure_ui_html_files(str(ui_root))

    assert not (ui_root / "home.html").exists()
    assert (ui_root / "home" / "index.html").read_text() == "home"
    assert not (ui_root / "mcp" / "oauth" / "callback.html").exists()
    assert (
        (ui_root / "mcp" / "oauth" / "callback" / "index.html").read_text()
        == "callback"
    )
    assert (ui_root / "existing" / "index.html").read_text() == "keep"
    assert (ui_root / "_next" / "ignore.html").read_text() == "asset"
    assert (
        (ui_root / "litellm-asset-prefix" / "ignore.html").read_text()
        == "asset"
    )


def test_ui_extensionless_route_requires_restructure(tmp_path):
    """
    Regression for non-root fallback: /ui/login expects login/index.html.
    Note: Restructuring always happens now, both in development and non-root Docker environments.
    """

    from litellm.proxy import proxy_server

    ui_root = tmp_path / "ui"
    ui_root.mkdir()
    (ui_root / "index.html").write_text("index")
    (ui_root / "login.html").write_text("login")

    fastapi_app = FastAPI()
    fastapi_app.mount(
        "/ui", StaticFiles(directory=str(ui_root), html=True), name="ui"
    )
    client = TestClient(fastapi_app)

    assert client.get("/ui/login.html").status_code == 200
    assert client.get("/ui/login").status_code == 404

    proxy_server._restructure_ui_html_files(str(ui_root))

    response = client.get("/ui/login")
    assert response.status_code == 200
    assert "login" in response.text


def test_restructure_always_happens(monkeypatch):
    """
    Test that restructuring logic always executes regardless of LITELLM_NON_ROOT setting.
    In development (is_non_root=False), restructuring happens directly in _experimental/out.
    In non-root Docker (is_non_root=True), restructuring happens in /var/lib/litellm/ui.
    """
    # Test Case 1: is_non_root is True - restructuring happens in /var/lib/litellm/ui
    monkeypatch.setenv("LITELLM_NON_ROOT", "true")

    runtime_ui_path = "/var/lib/litellm/ui"
    packaged_ui_path = "/some/packaged/ui/path"

    # Simulate the logic from proxy_server.py
    is_non_root = os.getenv("LITELLM_NON_ROOT", "").lower() == "true"
    if is_non_root:
        ui_path = runtime_ui_path
    else:
        ui_path = packaged_ui_path

    # Restructuring always happens now, regardless of ui_path vs packaged_ui_path
    should_restructure = True

    assert is_non_root is True
    assert should_restructure is True
    assert ui_path == runtime_ui_path

    # Test Case 2: is_non_root is False - restructuring happens directly in packaged_ui_path
    monkeypatch.delenv("LITELLM_NON_ROOT", raising=False)

    # Simulate the logic from proxy_server.py
    is_non_root = os.getenv("LITELLM_NON_ROOT", "").lower() == "true"
    if is_non_root:
        ui_path = runtime_ui_path
    else:
        ui_path = packaged_ui_path

    # Restructuring always happens now, even when ui_path == packaged_ui_path
    should_restructure = True

    assert is_non_root is False
    assert should_restructure is True
    assert ui_path == packaged_ui_path


@pytest.mark.asyncio
async def test_initialize_scheduled_jobs_credentials(monkeypatch):
    """
    Test that get_credentials is only called when store_model_in_db is True
    """
    monkeypatch.delenv("DISABLE_PRISMA_SCHEMA_UPDATE", raising=False)
    monkeypatch.delenv("STORE_MODEL_IN_DB", raising=False)
    from litellm.proxy.proxy_server import ProxyStartupEvent
    from litellm.proxy.utils import ProxyLogging

    # Mock dependencies
    mock_prisma_client = MagicMock()
    mock_proxy_logging = MagicMock(spec=ProxyLogging)
    mock_proxy_logging.slack_alerting_instance = MagicMock()
    mock_proxy_config = AsyncMock()

    with patch("litellm.proxy.proxy_server.proxy_config", mock_proxy_config), patch(
        "litellm.proxy.proxy_server.store_model_in_db", False
    ):  # set store_model_in_db to False
        # Test when store_model_in_db is False
        await ProxyStartupEvent.initialize_scheduled_background_jobs(
            general_settings={},
            prisma_client=mock_prisma_client,
            proxy_budget_rescheduler_min_time=1,
            proxy_budget_rescheduler_max_time=2,
            proxy_batch_write_at=5,
            proxy_logging_obj=mock_proxy_logging,
        )

        # Verify get_credentials was not called
        mock_proxy_config.get_credentials.assert_not_called()

    # Now test with store_model_in_db = True
    with patch("litellm.proxy.proxy_server.proxy_config", mock_proxy_config), patch(
        "litellm.proxy.proxy_server.store_model_in_db", True
    ), patch("litellm.proxy.proxy_server.get_secret_bool", return_value=True):
        await ProxyStartupEvent.initialize_scheduled_background_jobs(
            general_settings={},
            prisma_client=mock_prisma_client,
            proxy_budget_rescheduler_min_time=1,
            proxy_budget_rescheduler_max_time=2,
            proxy_batch_write_at=5,
            proxy_logging_obj=mock_proxy_logging,
        )

        # Verify get_credentials was called both directly and scheduled
        assert mock_proxy_config.get_credentials.call_count == 1  # Direct call

        # Verify a scheduled job was added for get_credentials
        mock_scheduler_calls = [
            call[0] for call in mock_proxy_config.get_credentials.mock_calls
        ]
        assert len(mock_scheduler_calls) > 0


def test_update_config_fields_deep_merge_db_wins():
    from litellm.proxy.proxy_server import ProxyConfig

    proxy_config = ProxyConfig()

    current_config = {
        "router_settings": {
            "routing_mode": "cost_optimized",
            "model_group_alias": {
                # Existing alias with older model + different hidden flag
                "claude-sonnet-4": {
                    "model": "claude-sonnet-4-20240219",
                    "hidden": True,
                },
                # An extra alias that should remain untouched unless DB overrides it
                "legacy-sonnet": {
                    "model": "claude-2.1",
                    "hidden": True,
                },
            },
        }
    }

    db_param_value = {
        "model_group_alias": {
            # Conflict: DB should win (both 'model' and 'hidden')
            "claude-sonnet-4": {
                "model": "claude-sonnet-4-20250514",
                "hidden": False,
            },
            # New alias to be added by the merge
            "claude-sonnet-latest": {
                "model": "claude-sonnet-4-20250514",
                "hidden": True,
            },
            # Demonstrate that None values from DB are skipped (preserve existing)
            "legacy-sonnet": {
                "hidden": None  # should not clobber current True
            },
        }
    }

    updated = proxy_config._update_config_fields(
        current_config=current_config,
        param_name="router_settings",
        db_param_value=db_param_value,
    )

    rs = updated["router_settings"]
    aliases = rs["model_group_alias"]

    # DB wins on conflicts (deep) for existing alias
    assert aliases["claude-sonnet-4"]["model"] == "claude-sonnet-4-20250514"
    assert aliases["claude-sonnet-4"]["hidden"] is False

    # New alias introduced by DB is present with its values
    assert "claude-sonnet-latest" in aliases
    assert aliases["claude-sonnet-latest"]["model"] == "claude-sonnet-4-20250514"
    assert aliases["claude-sonnet-latest"]["hidden"] is True

    # None in DB does not overwrite existing values
    assert aliases["legacy-sonnet"]["model"] == "claude-2.1"
    assert aliases["legacy-sonnet"]["hidden"] is True

    # Unrelated router_settings keys are preserved
    assert rs["routing_mode"] == "cost_optimized"


def test_get_config_custom_callback_api_env_vars(monkeypatch):
    """
    Ensure /get/config/callbacks returns custom callback env vars when both custom values are provided.
    """
    from litellm.proxy.proxy_server import app, proxy_config, user_api_key_auth

    # Mock config with custom_callback_api enabled and generic logger env vars present
    config_data = {
        "litellm_settings": {"success_callback": ["custom_callback_api"]},
        "general_settings": {},
        "environment_variables": {
            "GENERIC_LOGGER_ENDPOINT": "https://callback.example.com",
            "GENERIC_LOGGER_HEADERS": "Auth: token",
        },
    }

    # Mock proxy_config.get_config and router settings
    mock_router = MagicMock()
    mock_router.get_settings.return_value = {}
    monkeypatch.setattr("litellm.proxy.proxy_server.llm_router", mock_router)
    monkeypatch.setattr(
        proxy_config, "get_config", AsyncMock(return_value=config_data)
    )

    # Bypass auth dependency
    original_overrides = app.dependency_overrides.copy()
    app.dependency_overrides[user_api_key_auth] = lambda: MagicMock()

    client = TestClient(app)
    try:
        response = client.get("/get/config/callbacks")
    finally:
        app.dependency_overrides = original_overrides

    assert response.status_code == 200
    callbacks = response.json()["callbacks"]
    custom_cb = next(
        (cb for cb in callbacks if cb["name"] == "custom_callback_api"), None
    )

    assert custom_cb is not None
    assert custom_cb["variables"] == {
        "GENERIC_LOGGER_ENDPOINT": "https://callback.example.com",
        "GENERIC_LOGGER_HEADERS": "Auth: token",
    }


# Mock Prisma
class MockPrisma:
    def __init__(self, database_url=None, proxy_logging_obj=None, http_client=None):
        self.database_url = database_url
        self.proxy_logging_obj = proxy_logging_obj
        self.http_client = http_client

    async def connect(self):
        pass

    async def disconnect(self):
        pass


mock_prisma = MockPrisma()


@patch(
    "litellm.proxy.proxy_server.ProxyStartupEvent._setup_prisma_client",
    return_value=mock_prisma,
)
@pytest.mark.asyncio
async def test_aaaproxy_startup_master_key(mock_prisma, monkeypatch, tmp_path):
    """
    Test that master_key is correctly loaded from either config.yaml or environment variables
    """
    import yaml
    from fastapi import FastAPI

    # Import happens here - this is when the module probably reads the config path
    from litellm.proxy.proxy_server import proxy_startup_event

    # Mock the Prisma import
    monkeypatch.setattr("litellm.proxy.proxy_server.PrismaClient", MockPrisma)

    # Create test app
    app = FastAPI()

    # Test Case 1: Master key from config.yaml
    test_master_key = "sk-12345"
    test_config = {"general_settings": {"master_key": test_master_key}}

    # Create a temporary config file
    config_path = tmp_path / "config.yaml"
    with open(config_path, "w") as f:
        yaml.dump(test_config, f)

    print(f"SET ENV VARIABLE - CONFIG_FILE_PATH, str(config_path): {str(config_path)}")
    # Second setting of CONFIG_FILE_PATH to a different value
    monkeypatch.setenv("CONFIG_FILE_PATH", str(config_path))
    print(f"config_path: {config_path}")
    print(f"os.getenv('CONFIG_FILE_PATH'): {os.getenv('CONFIG_FILE_PATH')}")
    async with proxy_startup_event(app):
        from litellm.proxy.proxy_server import master_key

        assert master_key == test_master_key

    # Test Case 2: Master key from environment variable
    test_env_master_key = "sk-test-67890"

    # Create empty config
    empty_config = {"general_settings": {}}
    with open(config_path, "w") as f:
        yaml.dump(empty_config, f)

    monkeypatch.setenv("LITELLM_MASTER_KEY", test_env_master_key)
    print("test_env_master_key: {}".format(test_env_master_key))
    async with proxy_startup_event(app):
        from litellm.proxy.proxy_server import master_key

        assert master_key == test_env_master_key

    # Test Case 3: Master key with os.environ prefix
    test_resolved_key = "sk-resolved-key"
    test_config_with_prefix = {
        "general_settings": {"master_key": "os.environ/CUSTOM_MASTER_KEY"}
    }

    # Create config with os.environ prefix
    with open(config_path, "w") as f:
        yaml.dump(test_config_with_prefix, f)

    monkeypatch.setenv("CUSTOM_MASTER_KEY", test_resolved_key)
    async with proxy_startup_event(app):
        from litellm.proxy.proxy_server import master_key

        assert master_key == test_resolved_key


def test_team_info_masking():
    """
    Test that sensitive team information is properly masked

    Ref: https://huntr.com/bounties/661b388a-44d8-4ad5-862b-4dc5b80be30a
    """
    from litellm.proxy.proxy_server import ProxyConfig

    proxy_config = ProxyConfig()
    # Test team object with sensitive data
    team1_info = {
        "success_callback": "['langfuse', 's3']",
        "langfuse_secret": "secret-test-key",
        "langfuse_public_key": "public-test-key",
    }

    with pytest.raises(Exception) as exc_info:
        proxy_config._get_team_config(
            team_id="test_dev",
            all_teams_config=[team1_info],
        )

    print("Got exception: {}".format(exc_info.value))
    assert "secret-test-key" not in str(exc_info.value)
    assert "public-test-key" not in str(exc_info.value)


@mock_patch_aembedding()
def test_embedding_input_array_of_tokens(mock_aembedding, client_no_auth):
    """
    Test to bypass decoding input as array of tokens for selected providers

    Ref: https://github.com/BerriAI/litellm/issues/10113
    """
    try:
        test_data = {
            "model": "vllm_embed_model",
            "input": [[2046, 13269, 158208]],
        }

        response = client_no_auth.post("/v1/embeddings", json=test_data)

        # DEPRECATED - mock_aembedding.assert_called_once_with is too strict, and will fail when new kwargs are added to embeddings
        # mock_aembedding.assert_called_once_with(
        #     model="vllm_embed_model",
        #     input=[[2046, 13269, 158208]],
        #     metadata=mock.ANY,
        #     proxy_server_request=mock.ANY,
        #     secret_fields=mock.ANY,
        # )
        # Assert that aembedding was called, and that input was not modified
        mock_aembedding.assert_called_once()
        call_args, call_kwargs = mock_aembedding.call_args
        assert call_kwargs["model"] == "vllm_embed_model"
        assert call_kwargs["input"] == [[2046, 13269, 158208]]

        assert response.status_code == 200
        result = response.json()
        print(len(result["data"][0]["embedding"]))
        assert len(result["data"][0]["embedding"]) > 10  # this usually has len==1536 so
    except Exception as e:
        pytest.fail(f"LiteLLM Proxy test failed. Exception - {str(e)}")


@pytest.mark.asyncio
async def test_get_all_team_models():
    """
    Test get_all_team_models function with both "*" and specific team IDs
    """
    from unittest.mock import AsyncMock, MagicMock

    from litellm.proxy._types import LiteLLM_TeamTable
    from litellm.proxy.proxy_server import get_all_team_models

    # Mock team data
    mock_team1 = MagicMock()
    mock_team1.model_dump.return_value = {
        "team_id": "team1",
        "models": ["gpt-4", "gpt-3.5-turbo"],
        "team_alias": "Team 1",
    }

    mock_team2 = MagicMock()
    mock_team2.model_dump.return_value = {
        "team_id": "team2",
        "models": ["claude-3", "gpt-4"],
        "team_alias": "Team 2",
    }

    # Mock model data returned by router
    mock_models_gpt4 = [
        {"model_info": {"id": "gpt-4-model-1"}},
        {"model_info": {"id": "gpt-4-model-2"}},
    ]
    mock_models_gpt35 = [
        {"model_info": {"id": "gpt-3.5-turbo-model-1"}},
    ]
    mock_models_claude = [
        {"model_info": {"id": "claude-3-model-1"}},
    ]

    # Mock prisma client
    mock_prisma_client = MagicMock()
    mock_db = MagicMock()
    mock_litellm_teamtable = MagicMock()

    mock_prisma_client.db = mock_db
    mock_db.litellm_teamtable = mock_litellm_teamtable

    # Make find_many async
    mock_litellm_teamtable.find_many = AsyncMock()

    # Mock router
    mock_router = MagicMock()

    def mock_get_model_list(model_name, team_id=None):
        if model_name == "gpt-4":
            return mock_models_gpt4
        elif model_name == "gpt-3.5-turbo":
            return mock_models_gpt35
        elif model_name == "claude-3":
            return mock_models_claude
        return None

    mock_router.get_model_list.side_effect = mock_get_model_list

    # Test Case 1: user_teams = "*" (all teams)
    mock_litellm_teamtable.find_many.return_value = [mock_team1, mock_team2]

    with patch("litellm.proxy.proxy_server.LiteLLM_TeamTable") as mock_team_table_class:
        # Configure the mock class to return proper instances
        def mock_team_table_constructor(**kwargs):
            mock_instance = MagicMock()
            mock_instance.team_id = kwargs["team_id"]
            mock_instance.models = kwargs["models"]
            return mock_instance

        mock_team_table_class.side_effect = mock_team_table_constructor

        result = await get_all_team_models(
            user_teams="*",
            prisma_client=mock_prisma_client,
            llm_router=mock_router,
        )

        # Verify find_many was called without where clause for "*"
        mock_litellm_teamtable.find_many.assert_called_with()

        # Verify router.get_model_list was called for each model
        expected_calls = [
            mock.call(model_name="gpt-4", team_id="team1"),
            mock.call(model_name="gpt-3.5-turbo", team_id="team1"),
            mock.call(model_name="claude-3", team_id="team2"),
            mock.call(model_name="gpt-4", team_id="team2"),
        ]
        mock_router.get_model_list.assert_has_calls(expected_calls, any_order=True)

    # Test Case 2: user_teams = specific list
    mock_litellm_teamtable.reset_mock()
    mock_router.reset_mock()
    mock_router.get_model_list.side_effect = mock_get_model_list

    # Only return team1 for specific team query
    mock_litellm_teamtable.find_many.return_value = [mock_team1]

    with patch("litellm.proxy.proxy_server.LiteLLM_TeamTable") as mock_team_table_class:
        mock_team_table_class.side_effect = mock_team_table_constructor

        result = await get_all_team_models(
            user_teams=["team1"],
            prisma_client=mock_prisma_client,
            llm_router=mock_router,
        )

        # Verify find_many was called with where clause for specific teams
        mock_litellm_teamtable.find_many.assert_called_with(
            where={"team_id": {"in": ["team1"]}}
        )

        # Verify router.get_model_list was called only for team1 models
        expected_calls = [
            mock.call(model_name="gpt-4", team_id="team1"),
            mock.call(model_name="gpt-3.5-turbo", team_id="team1"),
        ]
        mock_router.get_model_list.assert_has_calls(expected_calls, any_order=True)

    # Test Case 3: Empty teams list
    mock_litellm_teamtable.reset_mock()
    mock_router.reset_mock()
    mock_litellm_teamtable.find_many.return_value = []

    result = await get_all_team_models(
        user_teams=[],
        prisma_client=mock_prisma_client,
        llm_router=mock_router,
    )

    # Verify find_many was called with empty list
    mock_litellm_teamtable.find_many.assert_called_with(where={"team_id": {"in": []}})

    # Should return empty list when no teams
    assert result == {}

    # Test Case 4: Router returns None for some models
    mock_litellm_teamtable.reset_mock()
    mock_router.reset_mock()
    mock_litellm_teamtable.find_many.return_value = [mock_team1]

    def mock_get_model_list_with_none(model_name, team_id=None):
        if model_name == "gpt-4":
            return mock_models_gpt4
        # Return None for gpt-3.5-turbo to test None handling
        return None

    mock_router.get_model_list.side_effect = mock_get_model_list_with_none

    with patch("litellm.proxy.proxy_server.LiteLLM_TeamTable") as mock_team_table_class:
        mock_team_table_class.side_effect = mock_team_table_constructor

        result = await get_all_team_models(
            user_teams=["team1"],
            prisma_client=mock_prisma_client,
            llm_router=mock_router,
        )

        # Should handle None return gracefully
        assert isinstance(result, dict)
        print("result: ", result)
        assert result == {"gpt-4-model-1": ["team1"], "gpt-4-model-2": ["team1"]}


def test_add_team_models_to_all_models():
    """
    Test add_team_models_to_all_models function
    """
    from litellm.proxy._types import LiteLLM_TeamTable
    from litellm.proxy.proxy_server import _add_team_models_to_all_models

    team_db_objects_typed = MagicMock(spec=LiteLLM_TeamTable)
    team_db_objects_typed.team_id = "team1"
    team_db_objects_typed.models = ["all-proxy-models"]

    llm_router = MagicMock()
    llm_router.get_model_list.return_value = [
        {"model_info": {"id": "gpt-4-model-1", "team_id": "team2"}},
        {"model_info": {"id": "gpt-4-model-2"}},
    ]

    result = _add_team_models_to_all_models(
        team_db_objects_typed=[team_db_objects_typed],
        llm_router=llm_router,
    )
    assert result == {"gpt-4-model-2": {"team1"}}


@pytest.mark.asyncio
async def test_delete_deployment_type_mismatch():
    """
    Test that the _delete_deployment function handles type mismatches correctly.
    Specifically test that models 12345678 and 12345679 are NOT deleted when
    they exist in both combined_id_list (as integers) and router_model_ids (as strings).

    This test reproduces the bug where type mismatch causes valid models to be deleted.
    """
    from unittest.mock import MagicMock, patch

    from litellm.proxy.proxy_server import ProxyConfig

    # Create mock ProxyConfig instance
    pc = ProxyConfig()

    pc.get_config = MagicMock(
        return_value={
            "model_list": [
                {
                    "model_name": "openai-gpt-4o",
                    "litellm_params": {"model": "gpt-4o"},
                    "model_info": {"id": 12345678},
                },
                {
                    "model_name": "openai-gpt-4o",
                    "litellm_params": {"model": "gpt-4o"},
                    "model_info": {"id": 12345679},
                },
            ]
        }
    )

    # Mock llm_router with string IDs (this is the source of the type mismatch)
    mock_llm_router = MagicMock()
    mock_llm_router.get_model_ids.return_value = [
        "a96e12e76b36a57cfae57a41288eb41567629cac89b4828c6f7074afc3534695",
        "a40186dd0fdb9b7282380277d7f57044d29de95bfbfcd7f4322b3493702d5cd3",
        "12345678",  # String ID
        "12345679",  # String ID
    ]

    # Track which deployments were deleted
    deleted_ids = []

    def mock_delete_deployment(id):
        deleted_ids.append(id)
        return True  # Simulate successful deletion

    mock_llm_router.delete_deployment = MagicMock(side_effect=mock_delete_deployment)

    # Mock get_config to return empty config (no config models)
    async def mock_get_config(config_file_path):
        return {}

    pc.get_config = MagicMock(side_effect=mock_get_config)

    # Patch the global llm_router
    with patch("litellm.proxy.proxy_server.llm_router", mock_llm_router), patch(
        "litellm.proxy.proxy_server.user_config_file_path", "test_config.yaml"
    ):

        # Call the function under test
        deleted_count = await pc._delete_deployment(db_models=[])

        # Assertions: Models 12345678 and 12345679 should NOT be deleted
        # because they exist in combined_id_list (as integers) even though
        # router has them as strings

        # The function should delete the other 2 models that are not in combined_id_list
        assert deleted_count == 0, f"Expected 0 deletions, got {deleted_count}"

        # Verify that 12345678 and 12345679 were NOT deleted
        assert (
            "12345678" not in deleted_ids
        ), f"Model 12345678 should NOT be deleted. Deleted IDs: {deleted_ids}"
        assert (
            "12345679" not in deleted_ids
        ), f"Model 12345679 should NOT be deleted. Deleted IDs: {deleted_ids}"


@pytest.mark.asyncio
async def test_get_config_from_file(tmp_path, monkeypatch):
    """
    Test the _get_config_from_file method of ProxyConfig class.
    Tests various scenarios: valid file, non-existent file, no file path, None config.
    """
    import yaml

    from litellm.proxy.proxy_server import ProxyConfig

    # Create a ProxyConfig instance
    proxy_config = ProxyConfig()

    # Test Case 1: Valid YAML config file exists
    test_config = {
        "model_list": [{"model_name": "gpt-4", "litellm_params": {"model": "gpt-4"}}],
        "general_settings": {"master_key": "sk-test"},
        "router_settings": {"enable_pre_call_checks": True},
        "litellm_settings": {"drop_params": True},
    }

    config_file = tmp_path / "test_config.yaml"
    with open(config_file, "w") as f:
        yaml.dump(test_config, f)

    # Clear global user_config_file_path for this test
    monkeypatch.setattr("litellm.proxy.proxy_server.user_config_file_path", None)

    result = await proxy_config._get_config_from_file(str(config_file))
    assert result == test_config

    # Verify that user_config_file_path was set
    from litellm.proxy.proxy_server import user_config_file_path

    assert user_config_file_path == str(config_file)

    # Test Case 2: File path provided but file doesn't exist
    non_existent_file = tmp_path / "non_existent.yaml"

    with pytest.raises(Exception, match=f"Config file not found: {non_existent_file}"):
        await proxy_config._get_config_from_file(str(non_existent_file))

    # Test Case 3: No file path provided (should return default config)
    monkeypatch.setattr("litellm.proxy.proxy_server.user_config_file_path", None)

    expected_default = {
        "model_list": [],
        "general_settings": {},
        "router_settings": {},
        "litellm_settings": {},
    }

    result = await proxy_config._get_config_from_file(None)
    assert result == expected_default

    # Test Case 4: Empty YAML file (should raise exception for None config)
    empty_file = tmp_path / "empty_config.yaml"
    with open(empty_file, "w") as f:
        f.write("")  # Write empty content which will result in None when loaded

    with pytest.raises(Exception, match="Config cannot be None or Empty."):
        await proxy_config._get_config_from_file(str(empty_file))

    # Test Case 5: Using global user_config_file_path when no config_file_path provided
    monkeypatch.setattr(
        "litellm.proxy.proxy_server.user_config_file_path", str(config_file)
    )

    result = await proxy_config._get_config_from_file(None)
    assert result == test_config


def test_normalize_datetime_for_sorting():
    """
    Test the _normalize_datetime_for_sorting function.
    Tests various scenarios: None values, ISO format strings, datetime objects (naive and aware).
    """
    from litellm.proxy.proxy_server import _normalize_datetime_for_sorting

    # Test Case 1: None value
    assert _normalize_datetime_for_sorting(None) is None

    # Test Case 2: ISO format string with 'Z' suffix
    dt_str_z = "2024-01-15T10:30:00Z"
    result = _normalize_datetime_for_sorting(dt_str_z)
    assert result is not None
    assert isinstance(result, datetime)
    assert result.tzinfo == timezone.utc
    assert result.year == 2024
    assert result.month == 1
    assert result.day == 15
    assert result.hour == 10
    assert result.minute == 30

    # Test Case 3: ISO format string without 'Z' suffix (naive)
    dt_str_naive = "2024-01-15T10:30:00"
    result = _normalize_datetime_for_sorting(dt_str_naive)
    assert result is not None
    assert isinstance(result, datetime)
    assert result.tzinfo == timezone.utc

    # Test Case 4: ISO format string with timezone offset
    dt_str_tz = "2024-01-15T10:30:00+05:00"
    result = _normalize_datetime_for_sorting(dt_str_tz)
    assert result is not None
    assert isinstance(result, datetime)
    assert result.tzinfo == timezone.utc
    # Should convert from +05:00 to UTC (subtract 5 hours)
    assert result.hour == 5  # 10:30 - 5 hours = 5:30 UTC

    # Test Case 5: Naive datetime object
    naive_dt = datetime(2024, 1, 15, 10, 30, 0)
    result = _normalize_datetime_for_sorting(naive_dt)
    assert result is not None
    assert isinstance(result, datetime)
    assert result.tzinfo == timezone.utc
    assert result.year == 2024
    assert result.month == 1
    assert result.day == 15

    # Test Case 6: Timezone-aware datetime object (non-UTC)
    from datetime import timedelta
    aware_dt = datetime(2024, 1, 15, 10, 30, 0, tzinfo=timezone(timedelta(hours=5)))
    result = _normalize_datetime_for_sorting(aware_dt)
    assert result is not None
    assert isinstance(result, datetime)
    assert result.tzinfo == timezone.utc
    # Should convert from +05:00 to UTC
    assert result.hour == 5

    # Test Case 7: UTC-aware datetime object
    utc_dt = datetime(2024, 1, 15, 10, 30, 0, tzinfo=timezone.utc)
    result = _normalize_datetime_for_sorting(utc_dt)
    assert result is not None
    assert isinstance(result, datetime)
    assert result.tzinfo == timezone.utc
    assert result == utc_dt

    # Test Case 8: Invalid string format
    invalid_str = "not-a-date"
    result = _normalize_datetime_for_sorting(invalid_str)
    assert result is None

    # Test Case 9: Invalid type (should return None)
    result = _normalize_datetime_for_sorting(12345)
    assert result is None


@pytest.mark.asyncio
async def test_add_proxy_budget_to_db_only_creates_user_no_keys():
    """
    Test that _add_proxy_budget_to_db only creates a user and no keys are added.

    This validates that generate_key_helper_fn is called with table_name="user"
    which should prevent key creation in LiteLLM_VerificationToken table.
    """
    from unittest.mock import AsyncMock, patch

    import litellm
    from litellm.proxy.proxy_server import ProxyStartupEvent

    # Set up required litellm settings
    litellm.budget_duration = "30d"
    litellm.max_budget = 100.0

    litellm_proxy_budget_name = "litellm-proxy-budget"

    # Mock generate_key_helper_fn to capture its call arguments
    mock_generate_key_helper = AsyncMock(
        return_value={
            "user_id": litellm_proxy_budget_name,
            "max_budget": 100.0,
            "budget_duration": "30d",
            "spend": 0,
            "models": [],
        }
    )

    # Patch generate_key_helper_fn in proxy_server where it's being called from
    with patch(
        "litellm.proxy.proxy_server.generate_key_helper_fn", mock_generate_key_helper
    ):
        # Call the function under test
        ProxyStartupEvent._add_proxy_budget_to_db(litellm_proxy_budget_name)

        # Allow async task to complete
        import asyncio

        await asyncio.sleep(0.1)

        # Verify that generate_key_helper_fn was called
        mock_generate_key_helper.assert_called_once()
        call_args = mock_generate_key_helper.call_args

        # Verify critical parameters that prevent key creation
        assert call_args.kwargs["request_type"] == "user"
        assert call_args.kwargs["table_name"] == "user"
        assert call_args.kwargs["user_id"] == litellm_proxy_budget_name
        assert call_args.kwargs["max_budget"] == 100.0
        assert call_args.kwargs["budget_duration"] == "30d"
        assert call_args.kwargs["query_type"] == "update_data"


@pytest.mark.asyncio
async def test_custom_ui_sso_sign_in_handler_config_loading():
    """
    Test that custom_ui_sso_sign_in_handler from config gets properly loaded into the global variable
    """
    import tempfile
    from unittest.mock import MagicMock, patch

    import yaml

    from litellm.proxy.proxy_server import ProxyConfig

    # Create a test config with custom_ui_sso_sign_in_handler
    test_config = {
        "general_settings": {
            "custom_ui_sso_sign_in_handler": "custom_hooks.custom_ui_sso_hook.custom_ui_sso_sign_in_handler"
        },
        "model_list": [],
        "router_settings": {},
        "litellm_settings": {},
    }

    # Create temporary config file
    with tempfile.NamedTemporaryFile(mode="w", suffix=".yaml", delete=False) as f:
        yaml.dump(test_config, f)
        config_file_path = f.name

    # Mock the get_instance_fn to return a mock handler
    mock_custom_handler = MagicMock()

    try:
        with patch(
            "litellm.proxy.proxy_server.get_instance_fn",
            return_value=mock_custom_handler,
        ) as mock_get_instance:
            # Create ProxyConfig instance and load config
            proxy_config = ProxyConfig()
            # Create a mock router since load_config requires it
            mock_router = MagicMock()
            await proxy_config.load_config(
                router=mock_router, config_file_path=config_file_path
            )

            # Verify get_instance_fn was called with correct parameters
            mock_get_instance.assert_called_with(
                value="custom_hooks.custom_ui_sso_hook.custom_ui_sso_sign_in_handler",
                config_file_path=config_file_path,
            )

            # Verify the global variable was set
            from litellm.proxy.proxy_server import user_custom_ui_sso_sign_in_handler

            assert user_custom_ui_sso_sign_in_handler == mock_custom_handler

    finally:
        # Clean up temporary file
        import os

        os.unlink(config_file_path)


@pytest.mark.asyncio
async def test_load_environment_variables_direct_and_os_environ():
    """
    Test _load_environment_variables method with direct values and os.environ/ prefixed values
    """
    from unittest.mock import patch

    from litellm.proxy.proxy_server import ProxyConfig

    proxy_config = ProxyConfig()

    # Test config with both direct values and os.environ/ prefixed values
    test_config = {
        "environment_variables": {
            "DIRECT_VAR": "direct_value",
            "NUMERIC_VAR": 12345,
            "BOOL_VAR": True,
            "SECRET_VAR": "os.environ/ACTUAL_SECRET_VAR",
        }
    }

    # Mock get_secret_str to return a resolved value
    mock_secret_value = "resolved_secret_value"

    with patch(
        "litellm.proxy.proxy_server.get_secret_str", return_value=mock_secret_value
    ) as mock_get_secret:
        with patch.dict(
            os.environ, {}, clear=False
        ):  # Don't clear existing env vars, just track changes
            # Call the method under test
            proxy_config._load_environment_variables(test_config)

            # Verify direct environment variables were set correctly
            assert os.environ["DIRECT_VAR"] == "direct_value"
            assert os.environ["NUMERIC_VAR"] == "12345"  # Should be converted to string
            assert os.environ["BOOL_VAR"] == "True"  # Should be converted to string

            # Verify os.environ/ prefixed variable was resolved and set
            assert os.environ["SECRET_VAR"] == mock_secret_value

            # Verify get_secret_str was called with the correct value
            mock_get_secret.assert_called_once_with(
                secret_name="os.environ/ACTUAL_SECRET_VAR"
            )


@pytest.mark.asyncio
async def test_load_environment_variables_litellm_license_and_edge_cases():
    """
    Test _load_environment_variables method with LITELLM_LICENSE special handling and edge cases
    """
    from unittest.mock import MagicMock, patch

    from litellm.proxy.proxy_server import ProxyConfig

    proxy_config = ProxyConfig()

    # Test Case 1: LITELLM_LICENSE in environment_variables
    test_config_with_license = {
        "environment_variables": {
            "LITELLM_LICENSE": "test_license_key",
            "OTHER_VAR": "other_value",
        }
    }

    # Mock _license_check
    mock_license_check = MagicMock()
    mock_license_check.is_premium.return_value = True

    with patch("litellm.proxy.proxy_server._license_check", mock_license_check):
        with patch.dict(os.environ, {}, clear=False):
            # Call the method under test
            proxy_config._load_environment_variables(test_config_with_license)

            # Verify LITELLM_LICENSE was set in environment
            assert os.environ["LITELLM_LICENSE"] == "test_license_key"

            # Verify license check was updated
            assert mock_license_check.license_str == "test_license_key"
            mock_license_check.is_premium.assert_called_once()

    # Test Case 2: No environment_variables in config
    test_config_no_env_vars = {}

    # This should not raise any errors and should return without doing anything
    result = proxy_config._load_environment_variables(test_config_no_env_vars)
    assert result is None  # Method returns None

    # Test Case 3: environment_variables is None
    test_config_none_env_vars = {"environment_variables": None}

    # This should not raise any errors and should return without doing anything
    result = proxy_config._load_environment_variables(test_config_none_env_vars)
    assert result is None  # Method returns None

    # Test Case 4: os.environ/ prefix but get_secret_str returns None
    test_config_secret_none = {
        "environment_variables": {"FAILED_SECRET": "os.environ/NONEXISTENT_SECRET"}
    }

    with patch("litellm.proxy.proxy_server.get_secret_str", return_value=None):
        with patch.dict(os.environ, {}, clear=False):
            # Call the method under test
            proxy_config._load_environment_variables(test_config_secret_none)

            # Verify that the environment variable was not set when secret resolution fails
            assert "FAILED_SECRET" not in os.environ


@pytest.mark.asyncio
async def test_write_config_to_file(monkeypatch):
    """
    Do not write config to file if store_model_in_db is True
    """
    from unittest.mock import AsyncMock, MagicMock, mock_open, patch

    from litellm.proxy.proxy_server import ProxyConfig

    # Set store_model_in_db to True
    monkeypatch.setattr("litellm.proxy.proxy_server.store_model_in_db", True)

    # Mock prisma_client to not be None (so DB path is taken)
    mock_prisma_client = AsyncMock()
    mock_prisma_client.insert_data = AsyncMock()
    monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client)

    # Mock general_settings
    mock_general_settings = {"store_model_in_db": True}
    monkeypatch.setattr(
        "litellm.proxy.proxy_server.general_settings", mock_general_settings
    )

    # Mock user_config_file_path
    test_config_path = "/tmp/test_config.yaml"
    monkeypatch.setattr(
        "litellm.proxy.proxy_server.user_config_file_path", test_config_path
    )

    proxy_config = ProxyConfig()

    # Mock the open function to track if file writing is attempted
    mock_file_open = mock_open()

    with patch("builtins.open", mock_file_open), patch("yaml.dump") as mock_yaml_dump:
        # Call save_config with test data
        test_config = {"key": "value", "model_list": ["model1", "model2"]}
        await proxy_config.save_config(new_config=test_config)

        # Verify that file was NOT opened for writing (since store_model_in_db=True)
        mock_file_open.assert_not_called()
        mock_yaml_dump.assert_not_called()

        # Verify that database insert was called instead
        mock_prisma_client.insert_data.assert_called_once()

        # Verify the config passed to DB has model_list removed
        call_args = mock_prisma_client.insert_data.call_args
        assert call_args.kwargs["data"] == {
            "key": "value"
        }  # model_list should be popped
        assert call_args.kwargs["table_name"] == "config"


@pytest.mark.asyncio
async def test_write_config_to_file_when_store_model_in_db_false(monkeypatch):
    """
    Test that config IS written to file when store_model_in_db is False
    """
    from unittest.mock import AsyncMock, MagicMock, mock_open, patch

    from litellm.proxy.proxy_server import ProxyConfig

    # Set store_model_in_db to False
    monkeypatch.setattr("litellm.proxy.proxy_server.store_model_in_db", False)

    # Mock prisma_client to be None (so file path is taken)
    monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", None)

    # Mock general_settings
    mock_general_settings = {"store_model_in_db": False}
    monkeypatch.setattr(
        "litellm.proxy.proxy_server.general_settings", mock_general_settings
    )

    # Mock user_config_file_path
    test_config_path = "/tmp/test_config.yaml"
    monkeypatch.setattr(
        "litellm.proxy.proxy_server.user_config_file_path", test_config_path
    )

    proxy_config = ProxyConfig()

    # Mock the open function and yaml.dump
    mock_file_open = mock_open()

    with patch("builtins.open", mock_file_open), patch("yaml.dump") as mock_yaml_dump:
        # Call save_config with test data
        test_config = {"key": "value", "other_key": "other_value"}
        await proxy_config.save_config(new_config=test_config)

        # Verify that file WAS opened for writing (since store_model_in_db=False)
        mock_file_open.assert_called_once_with(f"{test_config_path}", "w")

        # Verify yaml.dump was called with the config
        mock_yaml_dump.assert_called_once_with(
            test_config,
            mock_file_open.return_value.__enter__.return_value,
            default_flow_style=False,
        )


@pytest.mark.asyncio
async def test_async_data_generator_midstream_error():
    """
    Test async_data_generator handles midstream error from async_post_call_streaming_hook
    Specifically testing the case where Azure Content Safety Guardrail returns an error
    """
    from litellm.proxy._types import UserAPIKeyAuth
    from litellm.proxy.proxy_server import async_data_generator
    from litellm.proxy.utils import ProxyLogging

    # Create mock objects
    mock_user_api_key_dict = MagicMock(spec=UserAPIKeyAuth)
    mock_request_data = {
        "model": "gpt-3.5-turbo",
        "messages": [{"role": "user", "content": "test"}],
    }

    # Mock response chunks - simulating normal streaming that gets interrupted
    mock_chunks = [
        {"choices": [{"delta": {"content": "Hello"}}]},
        {"choices": [{"delta": {"content": " world"}}]},
        {"choices": [{"delta": {"content": " this"}}]},
    ]

    # Mock the proxy_logging_obj
    mock_proxy_logging_obj = MagicMock(spec=ProxyLogging)

    # Mock async_post_call_streaming_iterator_hook to yield chunks
    async def mock_streaming_iterator(*args, **kwargs):
        for chunk in mock_chunks:
            yield chunk

    mock_proxy_logging_obj.async_post_call_streaming_iterator_hook = (
        mock_streaming_iterator
    )

    # Mock async_post_call_streaming_hook to return error on third chunk
    def mock_streaming_hook(*args, **kwargs):
        chunk = kwargs.get("response")
        # Return error message for the third chunk (simulating guardrail trigger)
        if chunk == mock_chunks[2]:
            return 'data: {"error": {"error": "Azure Content Safety Guardrail: Hate crossed severity 2, Got severity: 2"}}'
        # Return normal chunks for first two
        return chunk

    mock_proxy_logging_obj.async_post_call_streaming_hook = AsyncMock(
        side_effect=mock_streaming_hook
    )
    mock_proxy_logging_obj.post_call_failure_hook = AsyncMock()

    # Mock the global proxy_logging_obj
    with patch("litellm.proxy.proxy_server.proxy_logging_obj", mock_proxy_logging_obj):
        # Create a mock response object
        mock_response = MagicMock()

        # Collect all yielded data from the generator
        yielded_data = []
        try:
            async for data in async_data_generator(
                mock_response, mock_user_api_key_dict, mock_request_data
            ):
                yielded_data.append(data)
        except Exception as e:
            # If there's an exception, that's also part of what we want to test
            pass

    # Verify the results
    assert (
        len(yielded_data) >= 3
    ), f"Expected at least 3 chunks, got {len(yielded_data)}: {yielded_data}"

    # First two chunks should be normal data
    assert yielded_data[0].startswith(
        "data: "
    ), f"First chunk should start with 'data: ', got: {yielded_data[0]}"
    assert yielded_data[1].startswith(
        "data: "
    ), f"Second chunk should start with 'data: ', got: {yielded_data[1]}"

    # The error message should be yielded
    error_found = False
    done_found = False

    for data in yielded_data:
        if "Azure Content Safety Guardrail: Hate crossed severity 2" in data:
            error_found = True
        if "data: [DONE]" in data:
            done_found = True

    assert (
        error_found
    ), f"Error message should be found in yielded data. Got: {yielded_data}"
    assert done_found, f"[DONE] message should be found at the end. Got: {yielded_data}"

    # Verify that the streaming hook was called for each chunk
    assert mock_proxy_logging_obj.async_post_call_streaming_hook.call_count == len(
        mock_chunks
    )

    # Verify that post_call_failure_hook was NOT called (since this is not an exception case)
    mock_proxy_logging_obj.post_call_failure_hook.assert_not_called()


def _has_nested_none_values(obj, path="root"):
    """
    Recursively check if an object contains nested None values.

    Args:
        obj: The object to check
        path: Current path in the object tree (for debugging)

    Returns:
        List of paths where None values were found
    """
    none_paths = []

    if obj is None:
        none_paths.append(path)
    elif isinstance(obj, dict):
        for key, value in obj.items():
            none_paths.extend(_has_nested_none_values(value, f"{path}.{key}"))
    elif isinstance(obj, (list, tuple)):
        for i, item in enumerate(obj):
            none_paths.extend(_has_nested_none_values(item, f"{path}[{i}]"))
    elif hasattr(obj, "__dict__"):
        # Handle object attributes
        for key, value in obj.__dict__.items():
            if not key.startswith("_"):  # Skip private attributes
                none_paths.extend(_has_nested_none_values(value, f"{path}.{key}"))

    return none_paths


@pytest.mark.asyncio
async def test_chat_completion_result_no_nested_none_values():
    """
    Test that chat_completion result doesn't have nested None values when using exclude_none=True
    """
    from unittest.mock import AsyncMock, MagicMock, patch

    from fastapi import Request, Response
    from pydantic import BaseModel

    import litellm
    from litellm.proxy._types import UserAPIKeyAuth
    from litellm.proxy.proxy_server import chat_completion

    # Create a mock ModelResponse with nested None values
    mock_model_response = litellm.ModelResponse()
    mock_model_response.id = "test-id"
    mock_model_response.model = "gpt-3.5-turbo"
    mock_model_response.object = "chat.completion"
    mock_model_response.created = 1234567890

    # Create message with None values that should be excluded
    mock_message = litellm.Message(
        content="Hello, world!",
        role="assistant",
        function_call=None,  # This should be excluded
        tool_calls=None,  # This should be excluded
        audio=None,  # This should be excluded
        reasoning_content=None,  # This should be excluded
        thinking_blocks=None,  # This should be excluded
        annotations=None,  # This should be excluded
    )

    # Create choice with potential None values
    mock_choice = litellm.Choices(
        finish_reason="stop",
        index=0,
        message=mock_message,
        logprobs=None,  # This should be excluded when exclude_none=True
    )

    mock_model_response.choices = [mock_choice]
    setattr(
        mock_model_response,
        "usage",
        litellm.Usage(prompt_tokens=10, completion_tokens=5, total_tokens=15),
    )

    # Verify the mock has None values before serialization
    raw_dict = mock_model_response.model_dump()
    none_paths_before = _has_nested_none_values(raw_dict)
    assert (
        len(none_paths_before) > 0
    ), "Mock should have None values before exclude_none=True"

    # Mock the request processing to return our mock response
    mock_base_processor = MagicMock()
    mock_base_processor.base_process_llm_request = AsyncMock(
        return_value=mock_model_response
    )

    # Mock other dependencies
    mock_request = MagicMock(spec=Request)
    mock_response = MagicMock(spec=Response)
    mock_user_api_key_dict = MagicMock(spec=UserAPIKeyAuth)

    with patch(
        "litellm.proxy.proxy_server._read_request_body",
        return_value={"model": "gpt-3.5-turbo", "messages": []},
    ), patch(
        "litellm.proxy.proxy_server.ProxyBaseLLMRequestProcessing",
        return_value=mock_base_processor,
    ):

        # Call the chat_completion function
        result = await chat_completion(
            request=mock_request,
            fastapi_response=mock_response,
            user_api_key_dict=mock_user_api_key_dict,
        )

    # Verify the result is a dict (since isinstance(result, BaseModel) was True)
    assert isinstance(result, dict), f"Expected dict result, got {type(result)}"

    # Check that there are no nested None values in the result
    none_paths_after = _has_nested_none_values(result)
    assert (
        len(none_paths_after) == 0
    ), f"Result should not contain nested None values. Found None at: {none_paths_after}"

    # Verify essential fields are present
    assert "id" in result
    assert "model" in result
    assert "object" in result
    assert "created" in result
    assert "choices" in result
    assert "usage" in result

    # Verify that the choices contain the expected message content
    assert len(result["choices"]) == 1
    assert result["choices"][0]["message"]["content"] == "Hello, world!"
    assert result["choices"][0]["message"]["role"] == "assistant"

    # Verify that None fields were excluded (should not be present in the dict)
    message = result["choices"][0]["message"]
    excluded_fields = [
        "function_call",
        "tool_calls",
        "audio",
        "reasoning_content",
        "thinking_blocks",
        "annotations",
    ]
    for field in excluded_fields:
        assert (
            field not in message
        ), f"Field '{field}' should be excluded when it's None"


# ============================================================================
# Price Data Reload Tests
# ============================================================================


class TestPriceDataReloadAPI:
    """Test cases for price data reload API endpoints"""

    @pytest.fixture
    def client_with_auth(self):
        """Create a test client with authentication"""
        from litellm.proxy._types import LitellmUserRoles
        from litellm.proxy.proxy_server import cleanup_router_config_variables

        cleanup_router_config_variables()
        filepath = os.path.dirname(os.path.abspath(__file__))
        config_fp = f"{filepath}/test_configs/test_config_no_auth.yaml"
        asyncio.run(initialize(config=config_fp, debug=True))

        # Mock admin user authentication
        mock_auth = MagicMock()
        mock_auth.user_role = LitellmUserRoles.PROXY_ADMIN
        app.dependency_overrides[user_api_key_auth] = lambda: mock_auth

        return TestClient(app)

    def test_reload_model_cost_map_admin_access(self, client_with_auth):
        """Test that admin users can access the reload endpoint"""
        with patch(
            "litellm.litellm_core_utils.get_model_cost_map.get_model_cost_map"
        ) as mock_get_map:
            mock_get_map.return_value = {
                "gpt-3.5-turbo": {"input_cost_per_token": 0.001}
            }
            # Mock the database connection
            with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma:
                mock_prisma.db.litellm_config.upsert = AsyncMock(return_value=None)

                response = client_with_auth.post("/reload/model_cost_map")

                assert response.status_code == 200
                data = response.json()
                assert data["status"] == "success"
                assert "message" in data
                assert "timestamp" in data
                assert "models_count" in data
                # The new implementation immediately reloads and returns the count
                assert (
                    "Price data reloaded successfully! 1 models updated."
                    in data["message"]
                )
                assert data["models_count"] == 1

    def test_reload_model_cost_map_non_admin_access(self, client_with_auth):
        """Test that non-admin users cannot access the reload endpoint"""
        # Mock non-admin user
        mock_auth = MagicMock()
        mock_auth.user_role = "user"  # Non-admin role
        app.dependency_overrides[user_api_key_auth] = lambda: mock_auth

        response = client_with_auth.post("/reload/model_cost_map")

        assert response.status_code == 403
        data = response.json()
        assert "Access denied" in data["detail"]
        assert "Admin role required" in data["detail"]

    def test_get_model_cost_map_public_access(self, client_no_auth):
        """Test that the model cost map endpoint is publicly accessible"""
        with patch(
            "litellm.model_cost", {"gpt-3.5-turbo": {"input_cost_per_token": 0.001}}
        ):
            response = client_no_auth.get("/public/litellm_model_cost_map")

            assert response.status_code == 200
            data = response.json()
            assert "gpt-3.5-turbo" in data

    def test_reload_model_cost_map_error_handling(self, client_with_auth):
        """Test error handling in the reload endpoint"""
        with patch(
            "litellm.litellm_core_utils.get_model_cost_map.get_model_cost_map"
        ) as mock_get_map:
            mock_get_map.side_effect = Exception("Network error")

            # Mock the database connection
            with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma:
                mock_prisma.db.litellm_config.upsert = AsyncMock(return_value=None)

                response = client_with_auth.post("/reload/model_cost_map")

                assert (
                    response.status_code == 500
                )  # The new implementation immediately reloads and fails on error
                data = response.json()
                assert "Failed to reload model cost map" in data["detail"]

    def test_schedule_model_cost_map_reload_admin_access(self, client_with_auth):
        """Test that admin users can schedule periodic reload"""
        with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma:
            # Mock database upsert
            mock_prisma.db.litellm_config.upsert = AsyncMock(return_value=None)

            response = client_with_auth.post("/schedule/model_cost_map_reload?hours=6")

            assert response.status_code == 200
            data = response.json()
            assert data["status"] == "success"
            assert data["interval_hours"] == 6
            assert "message" in data
            assert "timestamp" in data

    def test_schedule_model_cost_map_reload_non_admin_access(self, client_with_auth):
        """Test that non-admin users cannot schedule periodic reload"""
        # Mock non-admin user
        mock_auth = MagicMock()
        mock_auth.user_role = "user"  # Non-admin role
        app.dependency_overrides[user_api_key_auth] = lambda: mock_auth

        response = client_with_auth.post("/schedule/model_cost_map_reload?hours=6")

        assert response.status_code == 403
        data = response.json()
        assert "Access denied" in data["detail"]
        assert "Admin role required" in data["detail"]

    def test_schedule_model_cost_map_reload_invalid_hours(self, client_with_auth):
        """Test that invalid hours parameter is rejected"""
        response = client_with_auth.post("/schedule/model_cost_map_reload?hours=0")

        assert response.status_code == 400
        data = response.json()
        assert "Hours must be greater than 0" in data["detail"]

    def test_cancel_model_cost_map_reload_admin_access(self, client_with_auth):
        """Test that admin users can cancel periodic reload"""
        with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma:
            # Mock database delete
            mock_prisma.db.litellm_config.delete = AsyncMock(return_value=None)

            response = client_with_auth.delete("/schedule/model_cost_map_reload")

            assert response.status_code == 200
            data = response.json()
            assert data["status"] == "success"
            assert "message" in data
            assert "timestamp" in data

    def test_cancel_model_cost_map_reload_non_admin_access(self, client_with_auth):
        """Test that non-admin users cannot cancel periodic reload"""
        # Mock non-admin user
        mock_auth = MagicMock()
        mock_auth.user_role = "user"  # Non-admin role
        app.dependency_overrides[user_api_key_auth] = lambda: mock_auth

        response = client_with_auth.delete("/schedule/model_cost_map_reload")

        assert response.status_code == 403
        data = response.json()
        assert "Access denied" in data["detail"]
        assert "Admin role required" in data["detail"]

    def test_get_model_cost_map_reload_status_admin_access(self, client_with_auth):
        """Test that admin users can get reload status"""
        with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma:
            # Mock database config record
            mock_config = MagicMock()
            mock_config.param_value = {"interval_hours": 6, "force_reload": False}
            mock_prisma.db.litellm_config.find_unique = AsyncMock(
                return_value=mock_config
            )

            # Mock the last reload time and current time
            with patch(
                "litellm.proxy.proxy_server.last_model_cost_map_reload",
                "2024-01-01T06:00:00",
            ):
                with patch("litellm.proxy.proxy_server.datetime") as mock_datetime:
                    # Mock current time to be 1 hour after last reload
                    mock_datetime.utcnow.return_value = datetime(2024, 1, 1, 7, 0, 0)
                    mock_datetime.fromisoformat = datetime.fromisoformat

                    response = client_with_auth.get(
                        "/schedule/model_cost_map_reload/status"
                    )

                    assert response.status_code == 200
                    data = response.json()
                    assert data["scheduled"] == True
                    assert data["interval_hours"] == 6
                    assert data["last_run"] == "2024-01-01T06:00:00"
                    assert data["next_run"] == "2024-01-01T12:00:00"

    def test_get_model_cost_map_reload_status_non_admin_access(self, client_with_auth):
        """Test that non-admin users cannot get reload status"""
        # Mock non-admin user
        mock_auth = MagicMock()
        mock_auth.user_role = "user"  # Non-admin role
        app.dependency_overrides[user_api_key_auth] = lambda: mock_auth

        response = client_with_auth.get("/schedule/model_cost_map_reload/status")

        assert response.status_code == 403
        data = response.json()
        assert "Access denied" in data["detail"]
        assert "Admin role required" in data["detail"]

    def test_get_model_cost_map_reload_status_no_config(self, client_with_auth):
        """Test that status returns not scheduled when no config exists"""
        with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma:
            mock_prisma.db.litellm_config.find_unique = AsyncMock(return_value=None)

            response = client_with_auth.get("/schedule/model_cost_map_reload/status")

            assert response.status_code == 200
            data = response.json()
            assert data["scheduled"] == False
            assert data["interval_hours"] == None
            assert data["last_run"] == None
            assert data["next_run"] == None

    def test_get_model_cost_map_reload_status_no_interval(self, client_with_auth):
        """Test that status returns not scheduled when no interval is configured"""
        with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma:
            # Mock config with no interval
            mock_config = MagicMock()
            mock_config.param_value = {"interval_hours": None, "force_reload": False}
            mock_prisma.db.litellm_config.find_unique = AsyncMock(
                return_value=mock_config
            )

            response = client_with_auth.get("/schedule/model_cost_map_reload/status")

            assert response.status_code == 200
            data = response.json()
            assert data["scheduled"] == False
            assert data["interval_hours"] == None
            assert data["last_run"] == None
            assert data["next_run"] == None


class TestPriceDataReloadIntegration:
    """Integration tests for the complete price data reload feature"""

    @pytest.fixture
    def client_with_auth(self):
        """Create a test client with authentication"""
        from litellm.proxy._types import LitellmUserRoles
        from litellm.proxy.proxy_server import cleanup_router_config_variables

        cleanup_router_config_variables()
        filepath = os.path.dirname(os.path.abspath(__file__))
        config_fp = f"{filepath}/test_configs/test_config_no_auth.yaml"
        asyncio.run(initialize(config=config_fp, debug=True))

        # Mock admin user authentication
        mock_auth = MagicMock()
        mock_auth.user_role = LitellmUserRoles.PROXY_ADMIN
        app.dependency_overrides[user_api_key_auth] = lambda: mock_auth

        return TestClient(app)

    def test_complete_reload_flow(self, client_with_auth):
        """Test the complete reload flow from API to model cost update"""
        # Mock the model cost map
        mock_cost_map = {
            "gpt-3.5-turbo": {
                "input_cost_per_token": 0.001,
                "output_cost_per_token": 0.002,
            },
            "gpt-4": {"input_cost_per_token": 0.03, "output_cost_per_token": 0.06},
        }

        with patch(
            "litellm.litellm_core_utils.get_model_cost_map.get_model_cost_map"
        ) as mock_get_map:
            mock_get_map.return_value = mock_cost_map

            # Mock the database connection
            with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma:
                mock_prisma.db.litellm_config.upsert = AsyncMock(return_value=None)

                # Test reload endpoint
                response = client_with_auth.post("/reload/model_cost_map")
                assert response.status_code == 200

                # Test get endpoint
                response = client_with_auth.get("/public/litellm_model_cost_map")
                assert response.status_code == 200

    def test_distributed_reload_check_function(self):
        """Test the _check_and_reload_model_cost_map function"""
        from litellm.proxy.proxy_server import ProxyConfig

        proxy_config = ProxyConfig()

        # Mock prisma client
        mock_prisma = MagicMock()

        # Test case 1: No config in database
        mock_prisma.db.litellm_config.find_unique = AsyncMock(return_value=None)

        # Should return early without reloading
        asyncio.run(proxy_config._check_and_reload_model_cost_map(mock_prisma))

        # Test case 2: Config with interval but not time to reload
        mock_config = MagicMock()
        mock_config.param_value = {"interval_hours": 6, "force_reload": False}
        mock_prisma.db.litellm_config.find_unique = AsyncMock(return_value=mock_config)

        # Mock current time and last reload time
        with patch(
            "litellm.proxy.proxy_server.last_model_cost_map_reload",
            "2024-01-01T06:00:00",
        ):
            with patch("litellm.proxy.proxy_server.datetime") as mock_datetime:
                mock_datetime.utcnow.return_value = datetime(
                    2024, 1, 1, 7, 0, 0
                )  # 1 hour later

                # Should not reload (only 1 hour passed, need 6)
                asyncio.run(proxy_config._check_and_reload_model_cost_map(mock_prisma))

        # Test case 3: Config with force reload
        mock_config.param_value = {"interval_hours": 6, "force_reload": True}
        mock_prisma.db.litellm_config.find_unique = AsyncMock(return_value=mock_config)
        mock_prisma.db.litellm_config.upsert = AsyncMock(return_value=None)

        with patch(
            "litellm.litellm_core_utils.get_model_cost_map.get_model_cost_map"
        ) as mock_get_map:
            mock_get_map.return_value = {
                "gpt-3.5-turbo": {"input_cost_per_token": 0.001}
            }

            # Should reload due to force flag
            asyncio.run(proxy_config._check_and_reload_model_cost_map(mock_prisma))

            # Verify force_reload was reset to False
            mock_prisma.db.litellm_config.upsert.assert_called()
            call_args = mock_prisma.db.litellm_config.upsert.call_args
            # The param_value is now a JSON string, so we need to parse it
            param_value_json = call_args[1]["data"]["update"]["param_value"]
            param_value_dict = json.loads(param_value_json)
            assert param_value_dict["force_reload"] == False

    def test_config_file_parsing(self):
        """Test parsing of config file with reload settings"""
        config_content = """
general_settings:
  master_key: sk-1234
  model_cost_map_reload_interval: 21600

model_list:
  - model_name: gpt-3.5-turbo
    litellm_params:
      model: gpt-3.5-turbo
  - model_name: gpt-4
    litellm_params:
      model: gpt-4
"""

        # Parse the config
        config = yaml.safe_load(config_content)

        # Verify the reload setting is present
        assert "general_settings" in config
        assert "model_cost_map_reload_interval" in config["general_settings"]
        assert config["general_settings"]["model_cost_map_reload_interval"] == 21600

        # Verify models are present
        assert "model_list" in config
        assert len(config["model_list"]) == 2

    def test_database_config_storage(self):
        """Test that configuration is properly stored in database"""
        # Mock prisma client
        mock_prisma = MagicMock()

        # Test the database upsert call that would be made by the schedule endpoint
        mock_prisma.db.litellm_config.upsert = AsyncMock(return_value=None)

        # Simulate the database call that the schedule endpoint would make
        asyncio.run(
            mock_prisma.db.litellm_config.upsert(
                where={"param_name": "model_cost_map_reload_config"},
                data={
                    "create": {
                        "param_name": "model_cost_map_reload_config",
                        "param_value": {"interval_hours": 6, "force_reload": False},
                    },
                    "update": {
                        "param_value": {"interval_hours": 6, "force_reload": False}
                    },
                },
            )
        )

        # Verify database upsert was called with correct data
        mock_prisma.db.litellm_config.upsert.assert_called_once()
        call_args = mock_prisma.db.litellm_config.upsert.call_args
        assert call_args[1]["where"]["param_name"] == "model_cost_map_reload_config"
        assert call_args[1]["data"]["create"]["param_value"]["interval_hours"] == 6
        assert call_args[1]["data"]["create"]["param_value"]["force_reload"] == False

    def test_manual_reload_force_flag(self):
        """Test that manual reload sets force flag correctly"""
        # Mock prisma client
        mock_prisma = MagicMock()

        # Test the database upsert call that would be made by the manual reload endpoint
        mock_prisma.db.litellm_config.upsert = AsyncMock(return_value=None)

        # Simulate the database call that the manual reload endpoint would make
        asyncio.run(
            mock_prisma.db.litellm_config.upsert(
                where={"param_name": "model_cost_map_reload_config"},
                data={
                    "create": {
                        "param_name": "model_cost_map_reload_config",
                        "param_value": {"interval_hours": None, "force_reload": True},
                    },
                    "update": {"param_value": {"force_reload": True}},
                },
            )
        )

        # Verify force_reload flag was set
        mock_prisma.db.litellm_config.upsert.assert_called_once()
        call_args = mock_prisma.db.litellm_config.upsert.call_args
        assert call_args[1]["data"]["update"]["param_value"]["force_reload"] == True


@pytest.mark.asyncio
async def test_add_router_settings_from_db_config_merge_logic():
    """
    Test the _add_router_settings_from_db_config method's merge logic.

    This tests how router settings from config file and database are combined,
    including scenarios where nested dictionaries should be properly merged.
    """
    from unittest.mock import AsyncMock, MagicMock, patch

    from litellm.proxy.proxy_server import ProxyConfig

    # Create ProxyConfig instance
    proxy_config = ProxyConfig()

    # Mock router
    mock_router = MagicMock()
    mock_router.update_settings = MagicMock()

    # Test Case 1: Both config and DB settings exist - should merge them
    config_data = {
        "router_settings": {
            "routing_strategy": "usage-based-routing",
            "model_group_alias": {"gpt-4": "openai-gpt-4"},
            "enable_pre_call_checks": True,
            "timeout": 30,
            "nested_config": {"setting1": "config_value1", "setting2": "config_value2"},
        }
    }

    # Mock database config record
    mock_db_config = MagicMock()
    mock_db_config.param_value = {
        "routing_strategy": "least-busy",  # This should override config value
        "retry_delay": 2,  # This is new, should be added
        "nested_config": {
            "setting2": "db_value2",  # This should override config value
            "setting3": "db_value3",  # This is new, should be added
        },
    }

    # Mock prisma client
    mock_prisma_client = MagicMock()
    mock_prisma_client.db.litellm_config.find_first = AsyncMock(
        return_value=mock_db_config
    )

    # Call the method under test
    await proxy_config._add_router_settings_from_db_config(
        config_data=config_data,
        llm_router=mock_router,
        prisma_client=mock_prisma_client,
    )

    # Verify find_first was called with correct parameters
    mock_prisma_client.db.litellm_config.find_first.assert_called_once_with(
        where={"param_name": "router_settings"}
    )

    # Verify update_settings was called
    mock_router.update_settings.assert_called_once()

    # Get the actual settings passed to update_settings
    call_args = mock_router.update_settings.call_args
    combined_settings = call_args[1]  # kwargs

    # Verify the merge results
    # DB values should override config values
    assert combined_settings["routing_strategy"] == "least-busy"

    # Config-only values should be preserved
    assert combined_settings["model_group_alias"] == {"gpt-4": "openai-gpt-4"}
    assert combined_settings["enable_pre_call_checks"] == True
    assert combined_settings["timeout"] == 30

    # DB-only values should be added
    assert combined_settings["retry_delay"] == 2

    # Nested dictionaries should be merged (but this is shallow merge)
    expected_nested = {
        "setting1": "config_value1",
        "setting2": "db_value2",
        "setting3": "db_value3",
    }
    assert combined_settings["nested_config"] == expected_nested


@pytest.mark.asyncio
async def test_add_router_settings_from_db_config_edge_cases():
    """
    Test edge cases for _add_router_settings_from_db_config method.
    """
    from unittest.mock import AsyncMock, MagicMock

    from litellm.proxy.proxy_server import ProxyConfig

    proxy_config = ProxyConfig()
    mock_router = MagicMock()
    mock_router.update_settings = MagicMock()

    # Test Case 1: No router provided
    await proxy_config._add_router_settings_from_db_config(
        config_data={"router_settings": {"test": "value"}},
        llm_router=None,
        prisma_client=MagicMock(),
    )
    # Should not call anything when router is None
    mock_router.update_settings.assert_not_called()

    # Test Case 2: No prisma client provided
    await proxy_config._add_router_settings_from_db_config(
        config_data={"router_settings": {"test": "value"}},
        llm_router=mock_router,
        prisma_client=None,
    )
    # Should not call anything when prisma_client is None
    mock_router.update_settings.assert_not_called()

    # Test Case 3: DB returns None (no router_settings in DB)
    mock_prisma_client = MagicMock()
    mock_prisma_client.db.litellm_config.find_first = AsyncMock(return_value=None)

    config_data = {"router_settings": {"routing_strategy": "usage-based"}}

    await proxy_config._add_router_settings_from_db_config(
        config_data=config_data,
        llm_router=mock_router,
        prisma_client=mock_prisma_client,
    )

    # Should use only config settings
    mock_router.update_settings.assert_called_once_with(routing_strategy="usage-based")
    mock_router.reset_mock()

    # Test Case 4: Config has no router_settings
    mock_db_config = MagicMock()
    mock_db_config.param_value = {"db_setting": "db_value"}
    mock_prisma_client.db.litellm_config.find_first = AsyncMock(
        return_value=mock_db_config
    )

    await proxy_config._add_router_settings_from_db_config(
        config_data={},  # No router_settings in config
        llm_router=mock_router,
        prisma_client=mock_prisma_client,
    )

    # Should use only DB settings
    mock_router.update_settings.assert_called_once_with(db_setting="db_value")
    mock_router.reset_mock()

    # Test Case 5: Both config and DB router_settings are None/empty
    mock_prisma_client.db.litellm_config.find_first = AsyncMock(return_value=None)

    await proxy_config._add_router_settings_from_db_config(
        config_data={}, llm_router=mock_router, prisma_client=mock_prisma_client
    )

    # Should not call update_settings when no settings exist
    mock_router.update_settings.assert_not_called()

    # Test Case 6: DB config exists but param_value is not a dict
    mock_db_config_invalid = MagicMock()
    mock_db_config_invalid.param_value = "not_a_dict"
    mock_prisma_client.db.litellm_config.find_first = AsyncMock(
        return_value=mock_db_config_invalid
    )

    config_data = {"router_settings": {"config_setting": "config_value"}}

    await proxy_config._add_router_settings_from_db_config(
        config_data=config_data,
        llm_router=mock_router,
        prisma_client=mock_prisma_client,
    )

    # Should use only config settings when DB param_value is invalid
    mock_router.update_settings.assert_called_once_with(config_setting="config_value")


@pytest.mark.asyncio
async def test_add_router_settings_shallow_merge_behavior():
    """
    Test that the merge behavior is shallow (nested dicts get replaced, not merged).
    This documents the current behavior using _update_dictionary.
    """
    from unittest.mock import AsyncMock, MagicMock

    from litellm.proxy.proxy_server import ProxyConfig

    proxy_config = ProxyConfig()
    mock_router = MagicMock()
    mock_router.update_settings = MagicMock()

    # Config with nested dictionary
    config_data = {
        "router_settings": {
            "nested_setting": {
                "key1": "config_value1",
                "key2": "config_value2",
                "key3": "config_value3",
            },
            "top_level": "config_top",
        }
    }

    # DB config that partially overlaps the nested dictionary
    mock_db_config = MagicMock()
    mock_db_config.param_value = {
        "nested_setting": {
            "key2": "db_value2",  # Override existing key
            "key4": "db_value4",  # Add new key
            # Note: key1 and key3 from config will be lost due to shallow merge
        },
        "top_level": "db_top",  # Override top level
    }

    mock_prisma_client = MagicMock()
    mock_prisma_client.db.litellm_config.find_first = AsyncMock(
        return_value=mock_db_config
    )

    await proxy_config._add_router_settings_from_db_config(
        config_data=config_data,
        llm_router=mock_router,
        prisma_client=mock_prisma_client,
    )

    # Get the merged settings
    call_args = mock_router.update_settings.call_args
    merged_settings = call_args[1]

    # Verify shallow merge behavior:
    # The entire nested_setting dict from config is replaced by the DB version
    expected_nested = {
        "key1": "config_value1",
        "key3": "config_value3",
        "key2": "db_value2",
        "key4": "db_value4",
    }

    assert merged_settings["nested_setting"] == expected_nested
    assert merged_settings["top_level"] == "db_top"


@pytest.mark.asyncio
async def test_model_info_v1_oci_secrets_not_leaked():
    """
    Test that model_info_v1 endpoint properly masks OCI sensitive parameters and does not leak secrets.
    """
    from unittest.mock import MagicMock, patch

    from litellm.proxy._types import UserAPIKeyAuth
    from litellm.proxy.proxy_server import model_info_v1

    # Mock user authentication
    mock_user_api_key_dict = MagicMock(spec=UserAPIKeyAuth)
    mock_user_api_key_dict.user_id = "test-user"
    mock_user_api_key_dict.api_key = "test-key"
    mock_user_api_key_dict.team_models = []
    mock_user_api_key_dict.models = ["oci-grok-test"]

    # Mock model data with OCI sensitive information
    mock_model_data = {
        "model_name": "oci-grok-test",
        "litellm_params": {
            "model": "oci/xai.grok-4",
            "oci_key": "ocid1.api_key.oc1..aaaaaaaa7kbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbk",
            "oci_region": "us-phoenix-1",
            "oci_user": "ocid1.user.oc1..aaaaaaaa7kbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbk",
            "oci_fingerprint": "aa:bb:cc:dd:ee:ff:11:22:33:44:55:66:77:88:99:00",
            "oci_tenancy": "ocid1.tenancy.oc1..aaaaaaaa7kbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbk",
            "oci_key_file": "/path/to/oci_api_key.pem",
            "oci_compartment_id": "ocid1.compartment.oc1..aaaaaaaa7kbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbk",
            "drop_params": True
        },
        "model_info": {
            "mode": "completion",
            "id": "test-model-id"
        }
    }

    # Mock the llm_router to return our test data
    mock_router = MagicMock()
    mock_router.get_model_names.return_value = ["oci-grok-test"]
    mock_router.get_model_access_groups.return_value = {}
    mock_router.get_model_list.return_value = [mock_model_data]

    # Mock global variables
    with patch("litellm.proxy.proxy_server.llm_router", mock_router), \
         patch("litellm.proxy.proxy_server.llm_model_list", [mock_model_data]), \
         patch("litellm.proxy.proxy_server.general_settings", {"infer_model_from_keys": False}), \
         patch("litellm.proxy.proxy_server.user_model", None):

        # Call the model_info_v1 endpoint
        result = await model_info_v1(
            user_api_key_dict=mock_user_api_key_dict,
            litellm_model_id=None
        )

        # Verify the result structure
        assert "data" in result
        assert len(result["data"]) == 1

        model_info = result["data"][0]
        litellm_params = model_info["litellm_params"]

        # Verify that sensitive OCI fields are masked
        assert "****" in litellm_params["oci_key"], "oci_key should be masked"
        assert "****" in litellm_params["oci_fingerprint"], "oci_fingerprint should be masked"
        assert "****" in litellm_params["oci_tenancy"], "oci_tenancy should be masked"
        assert "****" in litellm_params["oci_key_file"], "oci_key_file should be masked"

        # Verify that non-sensitive fields are NOT masked
        assert litellm_params["model"] == "oci/xai.grok-4", "model field should not be masked"
        assert litellm_params["oci_region"] == "us-phoenix-1", "oci_region should not be masked"
        assert litellm_params["drop_params"] is True, "drop_params should not be masked"

        # Verify the model field specifically is not masked (this was the original issue)
        assert "****" not in litellm_params["model"], "model field should never be masked"
        assert litellm_params["model"].startswith("oci/"), "model should retain its full value"

        # Verify that actual secret values are not present in the response
        result_str = str(result)
        assert "ocid1.api_key.oc1..aaaaaaaa7kbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbk" not in result_str
        assert "aa:bb:cc:dd:ee:ff:11:22:33:44:55:66:77:88:99:00" not in result_str
        assert "ocid1.tenancy.oc1..aaaaaaaa7kbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbk" not in result_str
        assert "/path/to/oci_api_key.pem" not in result_str


def test_add_callback_from_db_to_in_memory_litellm_callbacks():
    """
    Test that _add_callback_from_db_to_in_memory_litellm_callbacks correctly adds callbacks
    for success, failure, and combined event types.
    """
    from unittest.mock import MagicMock, patch

    from litellm.proxy.proxy_server import ProxyConfig

    proxy_config = ProxyConfig()

    # Mock the callback manager
    mock_callback_manager = MagicMock()

    with patch("litellm.proxy.proxy_server.litellm") as mock_litellm:
        # Set up mock litellm attributes
        mock_litellm._known_custom_logger_compatible_callbacks = []
        mock_litellm.logging_callback_manager = mock_callback_manager

        # Test Case 1: Add success callback
        mock_success_callbacks = []
        proxy_config._add_callback_from_db_to_in_memory_litellm_callbacks(
            callback="prometheus",
            event_types=["success"],
            existing_callbacks=mock_success_callbacks,
        )
        mock_callback_manager.add_litellm_success_callback.assert_called_once_with("prometheus")
        mock_callback_manager.reset_mock()

        # Test Case 2: Add failure callback
        mock_failure_callbacks = []
        proxy_config._add_callback_from_db_to_in_memory_litellm_callbacks(
            callback="langfuse",
            event_types=["failure"],
            existing_callbacks=mock_failure_callbacks,
        )
        mock_callback_manager.add_litellm_failure_callback.assert_called_once_with("langfuse")
        mock_callback_manager.reset_mock()

        # Test Case 3: Add callback for both success and failure
        mock_callbacks = []
        proxy_config._add_callback_from_db_to_in_memory_litellm_callbacks(
            callback="s3",
            event_types=["success", "failure"],
            existing_callbacks=mock_callbacks,
        )
        mock_callback_manager.add_litellm_callback.assert_called_once_with("s3")
        mock_callback_manager.reset_mock()

        # Test Case 4: Don't add callback if it already exists
        existing_callbacks_with_item = ["prometheus"]
        proxy_config._add_callback_from_db_to_in_memory_litellm_callbacks(
            callback="prometheus",
            event_types=["success"],
            existing_callbacks=existing_callbacks_with_item,
        )
        mock_callback_manager.add_litellm_success_callback.assert_not_called()


def test_should_load_db_object_with_supported_db_objects():
    """
    Test _should_load_db_object method with supported_db_objects configuration.

    Verifies that when supported_db_objects is set, only specified object types
    are loaded from the database.
    """
    from unittest.mock import patch

    from litellm.proxy.proxy_server import ProxyConfig

    proxy_config = ProxyConfig()

    # Test Case 1: supported_db_objects not set - all objects should be loaded
    with patch("litellm.proxy.proxy_server.general_settings", {}):
        assert proxy_config._should_load_db_object(object_type="models") is True
        assert proxy_config._should_load_db_object(object_type="mcp") is True
        assert proxy_config._should_load_db_object(object_type="guardrails") is True
        assert proxy_config._should_load_db_object(object_type="vector_stores") is True

    # Test Case 2: supported_db_objects set to only load MCP
    with patch(
        "litellm.proxy.proxy_server.general_settings",
        {"supported_db_objects": ["mcp"]},
    ):
        assert proxy_config._should_load_db_object(object_type="models") is False
        assert proxy_config._should_load_db_object(object_type="mcp") is True
        assert proxy_config._should_load_db_object(object_type="guardrails") is False
        assert proxy_config._should_load_db_object(object_type="vector_stores") is False
        assert proxy_config._should_load_db_object(object_type="prompts") is False

    # Test Case 3: supported_db_objects set to load multiple types
    with patch(
        "litellm.proxy.proxy_server.general_settings",
        {"supported_db_objects": ["mcp", "guardrails", "vector_stores"]},
    ):
        assert proxy_config._should_load_db_object(object_type="models") is False
        assert proxy_config._should_load_db_object(object_type="mcp") is True
        assert proxy_config._should_load_db_object(object_type="guardrails") is True
        assert proxy_config._should_load_db_object(object_type="vector_stores") is True
        assert proxy_config._should_load_db_object(object_type="prompts") is False

    # Test Case 4: supported_db_objects is not a list (should default to loading all)
    with patch(
        "litellm.proxy.proxy_server.general_settings",
        {"supported_db_objects": "invalid_type"},
    ):
        assert proxy_config._should_load_db_object(object_type="models") is True
        assert proxy_config._should_load_db_object(object_type="mcp") is True

    # Test Case 5: supported_db_objects is an empty list (nothing should be loaded)
    with patch(
        "litellm.proxy.proxy_server.general_settings",
        {"supported_db_objects": []},
    ):
        assert proxy_config._should_load_db_object(object_type="models") is False
        assert proxy_config._should_load_db_object(object_type="mcp") is False
        assert proxy_config._should_load_db_object(object_type="guardrails") is False

    # Test Case 6: Test all available object types
    with patch(
        "litellm.proxy.proxy_server.general_settings",
        {
            "supported_db_objects": [
                "models",
                "mcp",
                "guardrails",
                "vector_stores",
                "pass_through_endpoints",
                "prompts",
                "model_cost_map",
            ]
        },
    ):
        assert proxy_config._should_load_db_object(object_type="models") is True
        assert proxy_config._should_load_db_object(object_type="mcp") is True
        assert proxy_config._should_load_db_object(object_type="guardrails") is True
        assert proxy_config._should_load_db_object(object_type="vector_stores") is True
        assert (
            proxy_config._should_load_db_object(object_type="pass_through_endpoints")
            is True
        )
        assert proxy_config._should_load_db_object(object_type="prompts") is True
        assert proxy_config._should_load_db_object(object_type="model_cost_map") is True


@pytest.mark.asyncio
async def test_tag_cache_update_called():
    """
    Test that update_cache updates tag cache when tags are provided.
    """
    from litellm.caching.caching import DualCache
    from litellm.proxy.proxy_server import user_api_key_cache

    cache = DualCache()

    setattr(
        litellm.proxy.proxy_server,
        "user_api_key_cache",
        cache,
    )

    mock_tag_obj = {
        "tag_name": "test-tag",
        "spend": 10.0,
    }

    with patch.object(cache, "async_get_cache", new=AsyncMock(return_value=mock_tag_obj)) as mock_get_cache:
        with patch.object(cache, "async_set_cache_pipeline", new=AsyncMock()) as mock_set_cache:
            await litellm.proxy.proxy_server.update_cache(
                token=None,
                user_id=None,
                end_user_id=None,
                team_id=None,
                response_cost=5.0,
                parent_otel_span=None,
                tags=["test-tag"],
            )

            await asyncio.sleep(0.1)

            mock_get_cache.assert_awaited_once_with(key="tag:test-tag")
            mock_set_cache.assert_awaited_once()

            call_args = mock_set_cache.call_args
            cache_list = call_args.kwargs["cache_list"]

            assert len(cache_list) == 1
            cache_key, cache_value = cache_list[0]
            assert cache_key == "tag:test-tag"
            assert cache_value["spend"] == 15.0


@pytest.mark.asyncio
async def test_tag_cache_update_multiple_tags():
    """
    Test that multiple tags are updated in cache.
    """
    from litellm.caching.caching import DualCache
    from litellm.proxy.proxy_server import user_api_key_cache

    cache = DualCache()

    setattr(
        litellm.proxy.proxy_server,
        "user_api_key_cache",
        cache,
    )

    mock_tag1_obj = {"tag_name": "tag1", "spend": 10.0}
    mock_tag2_obj = {"tag_name": "tag2", "spend": 20.0}

    async def mock_get_cache_side_effect(key):
        if key == "tag:tag1":
            return mock_tag1_obj
        elif key == "tag:tag2":
            return mock_tag2_obj
        return None

    with patch.object(cache, "async_get_cache", new=AsyncMock(side_effect=mock_get_cache_side_effect)) as mock_get_cache:
        with patch.object(cache, "async_set_cache_pipeline", new=AsyncMock()) as mock_set_cache:
            await litellm.proxy.proxy_server.update_cache(
                token=None,
                user_id=None,
                end_user_id=None,
                team_id=None,
                response_cost=5.0,
                parent_otel_span=None,
                tags=["tag1", "tag2"],
            )

            await asyncio.sleep(0.1)

            assert mock_get_cache.call_count == 2
            mock_set_cache.assert_awaited_once()

            call_args = mock_set_cache.call_args
            cache_list = call_args.kwargs["cache_list"]

            assert len(cache_list) == 2

            tag_updates = {cache_key: cache_value for cache_key, cache_value in cache_list}
            assert "tag:tag1" in tag_updates
            assert "tag:tag2" in tag_updates
            assert tag_updates["tag:tag1"]["spend"] == 15.0
            assert tag_updates["tag:tag2"]["spend"] == 25.0


@pytest.mark.asyncio
async def test_init_sso_settings_in_db():
    """
    Test that _init_sso_settings_in_db properly loads SSO settings from database,
    uppercases keys, and calls _decrypt_and_set_db_env_variables.
    """
    from unittest.mock import AsyncMock, MagicMock, patch

    from litellm.proxy.proxy_server import ProxyConfig

    proxy_config = ProxyConfig()

    # Test Case 1: SSO settings exist in database
    mock_sso_config = MagicMock()
    mock_sso_config.sso_settings = {
        "google_client_id": "test-client-id",
        "google_client_secret": "test-client-secret",
        "microsoft_client_id": "ms-client-id",
        "microsoft_client_secret": "ms-client-secret",
    }

    mock_prisma_client = MagicMock()
    mock_prisma_client.db.litellm_ssoconfig.find_unique = AsyncMock(
        return_value=mock_sso_config
    )

    # Mock _decrypt_and_set_db_env_variables
    with patch.object(
        proxy_config, "_decrypt_and_set_db_env_variables"
    ) as mock_decrypt_and_set:
        await proxy_config._init_sso_settings_in_db(prisma_client=mock_prisma_client)

        # Verify find_unique was called with correct parameters
        mock_prisma_client.db.litellm_ssoconfig.find_unique.assert_awaited_once_with(
            where={"id": "sso_config"}
        )

        # Verify _decrypt_and_set_db_env_variables was called with uppercased keys
        mock_decrypt_and_set.assert_called_once()
        call_args = mock_decrypt_and_set.call_args
        uppercased_settings = call_args.kwargs["environment_variables"]

        # Verify all keys are uppercased
        assert "GOOGLE_CLIENT_ID" in uppercased_settings
        assert "GOOGLE_CLIENT_SECRET" in uppercased_settings
        assert "MICROSOFT_CLIENT_ID" in uppercased_settings
        assert "MICROSOFT_CLIENT_SECRET" in uppercased_settings

        # Verify values are preserved
        assert uppercased_settings["GOOGLE_CLIENT_ID"] == "test-client-id"
        assert uppercased_settings["GOOGLE_CLIENT_SECRET"] == "test-client-secret"
        assert uppercased_settings["MICROSOFT_CLIENT_ID"] == "ms-client-id"
        assert uppercased_settings["MICROSOFT_CLIENT_SECRET"] == "ms-client-secret"

        # Verify original lowercase keys are not present
        assert "google_client_id" not in uppercased_settings
        assert "microsoft_client_id" not in uppercased_settings


@pytest.mark.asyncio
async def test_init_sso_settings_in_db_no_settings():
    """
    Test that _init_sso_settings_in_db handles the case when no SSO settings exist in database.
    """
    from unittest.mock import AsyncMock, MagicMock, patch

    from litellm.proxy.proxy_server import ProxyConfig

    proxy_config = ProxyConfig()

    # Mock prisma client to return None (no SSO settings)
    mock_prisma_client = MagicMock()
    mock_prisma_client.db.litellm_ssoconfig.find_unique = AsyncMock(return_value=None)

    # Mock _decrypt_and_set_db_env_variables
    with patch.object(
        proxy_config, "_decrypt_and_set_db_env_variables"
    ) as mock_decrypt_and_set:
        await proxy_config._init_sso_settings_in_db(prisma_client=mock_prisma_client)

        # Verify find_unique was called
        mock_prisma_client.db.litellm_ssoconfig.find_unique.assert_awaited_once_with(
            where={"id": "sso_config"}
        )

        # Verify _decrypt_and_set_db_env_variables was NOT called when no settings exist
        mock_decrypt_and_set.assert_not_called()


@pytest.mark.asyncio
async def test_init_sso_settings_in_db_error_handling():
    """
    Test that _init_sso_settings_in_db handles database errors gracefully.
    """
    from unittest.mock import AsyncMock, MagicMock, patch

    from litellm.proxy.proxy_server import ProxyConfig

    proxy_config = ProxyConfig()

    # Mock prisma client to raise an exception
    mock_prisma_client = MagicMock()
    mock_prisma_client.db.litellm_ssoconfig.find_unique = AsyncMock(
        side_effect=Exception("Database connection error")
    )

    # The method should not raise an exception, it should log it instead
    try:
        await proxy_config._init_sso_settings_in_db(prisma_client=mock_prisma_client)
        # If we get here, the exception was handled properly
        assert True
    except Exception as e:
        # The exception should be caught and logged, not propagated
        pytest.fail(f"Exception should have been caught and logged, but was raised: {e}")


@pytest.mark.asyncio
async def test_init_sso_settings_in_db_empty_settings():
    """
    Test that _init_sso_settings_in_db handles empty SSO settings dictionary.
    """
    from unittest.mock import AsyncMock, MagicMock, patch

    from litellm.proxy.proxy_server import ProxyConfig

    proxy_config = ProxyConfig()

    # Mock SSO config with empty settings dictionary
    mock_sso_config = MagicMock()
    mock_sso_config.sso_settings = {}

    mock_prisma_client = MagicMock()
    mock_prisma_client.db.litellm_ssoconfig.find_unique = AsyncMock(
        return_value=mock_sso_config
    )

    # Mock _decrypt_and_set_db_env_variables
    with patch.object(
        proxy_config, "_decrypt_and_set_db_env_variables"
    ) as mock_decrypt_and_set:
        await proxy_config._init_sso_settings_in_db(prisma_client=mock_prisma_client)

        # Verify find_unique was called
        mock_prisma_client.db.litellm_ssoconfig.find_unique.assert_awaited_once_with(
            where={"id": "sso_config"}
        )

        # Verify _decrypt_and_set_db_env_variables was called with empty dict
        mock_decrypt_and_set.assert_called_once()
        call_args = mock_decrypt_and_set.call_args
        uppercased_settings = call_args.kwargs["environment_variables"]

        # Verify empty dictionary
        assert uppercased_settings == {}


def test_update_config_fields_uppercases_env_vars(monkeypatch):
    """
    Ensure environment variables pulled from DB are uppercased when applied so
    integrations like Datadog that expect uppercase env keys can read them.
    """
    from litellm.proxy.proxy_server import ProxyConfig

    for key in ["DD_API_KEY", "DD_SITE", "dd_api_key", "dd_site"]:
        monkeypatch.delenv(key, raising=False)

    proxy_config = ProxyConfig()
    updated_config = proxy_config._update_config_fields(
        current_config={},
        param_name="environment_variables",
        db_param_value={"dd_api_key": "test-api-key", "dd_site": "us5.datadoghq.com"},
    )

    env_vars = updated_config.get("environment_variables", {})
    assert env_vars["DD_API_KEY"] == "test-api-key"
    assert env_vars["DD_SITE"] == "us5.datadoghq.com"
    assert os.environ.get("DD_API_KEY") == "test-api-key"
    assert os.environ.get("DD_SITE") == "us5.datadoghq.com"


def test_get_prompt_spec_for_db_prompt_with_versions():
    """
    Test that _get_prompt_spec_for_db_prompt correctly converts database prompts
    to PromptSpec with versioned naming convention.
    """
    from unittest.mock import MagicMock

    from litellm.proxy.proxy_server import ProxyConfig

    proxy_config = ProxyConfig()

    # Mock database prompt version 1
    mock_prompt_v1 = MagicMock()
    mock_prompt_v1.model_dump.return_value = {
        "id": "uuid-1",
        "prompt_id": "chat_prompt",
        "version": 1,
        "litellm_params": '{"prompt_id": "chat_prompt", "prompt_integration": "dotprompt", "model": "gpt-3.5-turbo", "messages": [{"role": "user", "content": "v1 content"}]}',
        "prompt_info": '{"prompt_type": "db"}',
        "created_at": "2024-01-01T00:00:00",
        "updated_at": "2024-01-01T00:00:00",
    }

    # Mock database prompt version 2
    mock_prompt_v2 = MagicMock()
    mock_prompt_v2.model_dump.return_value = {
        "id": "uuid-2",
        "prompt_id": "chat_prompt",
        "version": 2,
        "litellm_params": '{"prompt_id": "chat_prompt", "prompt_integration": "dotprompt", "model": "gpt-4", "messages": [{"role": "user", "content": "v2 content"}]}',
        "prompt_info": '{"prompt_type": "db"}',
        "created_at": "2024-01-02T00:00:00",
        "updated_at": "2024-01-02T00:00:00",
    }

    # Test version 1
    prompt_spec_v1 = proxy_config._get_prompt_spec_for_db_prompt(db_prompt=mock_prompt_v1)
    assert prompt_spec_v1.prompt_id == "chat_prompt.v1"

    # Test version 2
    prompt_spec_v2 = proxy_config._get_prompt_spec_for_db_prompt(db_prompt=mock_prompt_v2)
    assert prompt_spec_v2.prompt_id == "chat_prompt.v2"


def test_root_redirect_when_docs_url_not_root_and_redirect_url_set(monkeypatch):
    from fastapi.responses import RedirectResponse

    from litellm.proxy.proxy_server import cleanup_router_config_variables
    from litellm.proxy.utils import _get_docs_url

    cleanup_router_config_variables()
    filepath = os.path.dirname(os.path.abspath(__file__))
    config_fp = f"{filepath}/test_configs/test_config_no_auth.yaml"
    # Ensure docs are mounted on a non-root path to trigger redirect logic
    monkeypatch.setenv("DOCS_URL", "/docs")

    test_redirect_url = "/ui"
    monkeypatch.setenv("ROOT_REDIRECT_URL", test_redirect_url)

    asyncio.run(initialize(config=config_fp, debug=True))

    docs_url = _get_docs_url()
    root_redirect_url = os.getenv("ROOT_REDIRECT_URL")

    # Remove any existing "/" route that might interfere
    routes_to_remove = []
    for route in app.routes:
        if hasattr(route, "path") and route.path == "/":
            if hasattr(route, "methods") and "GET" in route.methods:
                routes_to_remove.append(route)
            elif not hasattr(route, "methods"):  # Catch-all routes
                routes_to_remove.append(route)

    for route in routes_to_remove:
        app.routes.remove(route)

    # Add the redirect route if conditions are met (matching the actual implementation)
    if docs_url != "/" and root_redirect_url:
        @app.get("/", include_in_schema=False)
        async def root_redirect():
            return RedirectResponse(url=root_redirect_url)

    client = TestClient(app)
    response = client.get("/", follow_redirects=False)
    assert response.status_code == 307
    assert response.headers["location"] == test_redirect_url


@pytest.mark.asyncio
async def test_get_image_non_root_uses_var_lib_assets_dir(monkeypatch):
    """
    Test that get_image uses /var/lib/litellm/assets when LITELLM_NON_ROOT is true.
    """
    from unittest.mock import patch

    from litellm.proxy.proxy_server import get_image

    # Set LITELLM_NON_ROOT to true
    monkeypatch.setenv("LITELLM_NON_ROOT", "true")
    monkeypatch.delenv("UI_LOGO_PATH", raising=False)

    # Mock os.path operations
    with patch("litellm.proxy.proxy_server.os.makedirs") as mock_makedirs, \
         patch("litellm.proxy.proxy_server.os.path.exists", return_value=True), \
         patch("litellm.proxy.proxy_server.os.getenv") as mock_getenv, \
         patch("litellm.proxy.proxy_server.FileResponse") as mock_file_response:

        # Setup mock_getenv to return empty string for UI_LOGO_PATH
        def getenv_side_effect(key, default=""):
            if key == "UI_LOGO_PATH":
                return ""
            elif key == "LITELLM_NON_ROOT":
                return "true"
            return default

        mock_getenv.side_effect = getenv_side_effect

        # Call the function
        await get_image()

        # Verify makedirs was called with /var/lib/litellm/assets
        mock_makedirs.assert_called_once_with("/var/lib/litellm/assets", exist_ok=True)


@pytest.mark.asyncio
async def test_get_image_non_root_fallback_to_default_logo(monkeypatch):
    """
    Test that get_image falls back to default_site_logo when logo doesn't exist
    in /var/lib/litellm/assets for non-root case.
    """
    from unittest.mock import patch

    from litellm.proxy.proxy_server import get_image

    # Set LITELLM_NON_ROOT to true
    monkeypatch.setenv("LITELLM_NON_ROOT", "true")
    monkeypatch.delenv("UI_LOGO_PATH", raising=False)

    # Track path.exists calls to verify it checks /var/lib/litellm/assets/logo.jpg
    exists_calls = []

    def exists_side_effect(path):
        exists_calls.append(path)
        # Return False for /var/lib/litellm/assets/logo.jpg to trigger fallback
        if "/var/lib/litellm/assets/logo.jpg" in path:
            return False
        return True

    # Mock os.path operations
    with patch("litellm.proxy.proxy_server.os.makedirs") as mock_makedirs, \
         patch("litellm.proxy.proxy_server.os.path.exists", side_effect=exists_side_effect), \
         patch("litellm.proxy.proxy_server.os.getenv") as mock_getenv, \
         patch("litellm.proxy.proxy_server.FileResponse") as mock_file_response:

        # Setup mock_getenv
        def getenv_side_effect(key, default=""):
            if key == "UI_LOGO_PATH":
                return ""
            elif key == "LITELLM_NON_ROOT":
                return "true"
            return default

        mock_getenv.side_effect = getenv_side_effect

        # Call the function
        await get_image()

        # Verify makedirs was called with /var/lib/litellm/assets
        mock_makedirs.assert_called_once_with("/var/lib/litellm/assets", exist_ok=True)

        # Verify that exists was called to check /var/lib/litellm/assets/logo.jpg
        assets_logo_path = "/var/lib/litellm/assets/logo.jpg"
        assert any(assets_logo_path in str(call) for call in exists_calls), \
            f"Should check if {assets_logo_path} exists"

        # Verify FileResponse was called (with fallback logo)
        assert mock_file_response.called, "FileResponse should be called"


@pytest.mark.asyncio
async def test_get_image_root_case_uses_current_dir(monkeypatch):
    """
    Test that get_image uses current_dir when LITELLM_NON_ROOT is not true.
    """
    from unittest.mock import patch

    from litellm.proxy.proxy_server import get_image

    # Don't set LITELLM_NON_ROOT (or set it to false)
    monkeypatch.delenv("LITELLM_NON_ROOT", raising=False)
    monkeypatch.delenv("UI_LOGO_PATH", raising=False)

    # Mock os.path operations
    with patch("litellm.proxy.proxy_server.os.makedirs") as mock_makedirs, \
         patch("litellm.proxy.proxy_server.os.path.exists", return_value=True), \
         patch("litellm.proxy.proxy_server.os.getenv") as mock_getenv, \
         patch("litellm.proxy.proxy_server.FileResponse") as mock_file_response:

        # Setup mock_getenv
        def getenv_side_effect(key, default=""):
            if key == "UI_LOGO_PATH":
                return ""
            elif key == "LITELLM_NON_ROOT":
                return ""  # Not set or empty
            return default

        mock_getenv.side_effect = getenv_side_effect

        # Call the function
        await get_image()

        # Verify makedirs was NOT called with /var/lib/litellm/assets (should not create it for root case)
        var_lib_assets_calls = [
            call for call in mock_makedirs.call_args_list
            if "/var/lib/litellm/assets" in str(call)
        ]
        assert len(var_lib_assets_calls) == 0, "Should not create /var/lib/litellm/assets for root case"

        # Verify FileResponse was called
        assert mock_file_response.called, "FileResponse should be called"


def test_get_config_normalizes_string_callbacks(monkeypatch):
    """
    Test that /get/config/callbacks normalizes string callbacks to lists.
    """
    from litellm.proxy.proxy_server import app, proxy_config, user_api_key_auth

    config_data = {
        "litellm_settings": {
            "success_callback": "langfuse",
            "failure_callback": None,
            "callbacks": ["prometheus", "datadog"],
        },
        "general_settings": {},
        "environment_variables": {},
    }

    mock_router = MagicMock()
    mock_router.get_settings.return_value = {}
    monkeypatch.setattr("litellm.proxy.proxy_server.llm_router", mock_router)
    monkeypatch.setattr(
        proxy_config, "get_config", AsyncMock(return_value=config_data)
    )

    original_overrides = app.dependency_overrides.copy()
    app.dependency_overrides[user_api_key_auth] = lambda: MagicMock()

    client = TestClient(app)
    try:
        response = client.get("/get/config/callbacks")
    finally:
        app.dependency_overrides = original_overrides

    assert response.status_code == 200
    callbacks = response.json()["callbacks"]

    success_callbacks = [cb["name"] for cb in callbacks if cb.get("type") == "success"]
    failure_callbacks = [cb["name"] for cb in callbacks if cb.get("type") == "failure"]
    success_and_failure_callbacks = [
        cb["name"] for cb in callbacks if cb.get("type") == "success_and_failure"
    ]

    assert "langfuse" in success_callbacks
    assert len(failure_callbacks) == 0
    assert "prometheus" in success_and_failure_callbacks
    assert "datadog" in success_and_failure_callbacks


def test_deep_merge_dicts_skips_none_and_empty_lists(monkeypatch):
    """
    Test that _update_config_fields deep merge skips None values and empty lists.
    """
    from litellm.proxy.proxy_server import ProxyConfig

    proxy_config = ProxyConfig()

    current_config = {
        "general_settings": {
            "max_parallel_requests": 10,
            "allowed_models": ["gpt-3.5-turbo", "gpt-4"],
            "nested": {
                "key1": "value1",
                "key2": "value2",
            },
        }
    }

    db_param_value = {
        "max_parallel_requests": None,
        "allowed_models": [],
        "new_key": "new_value",
        "nested": {
            "key1": "updated_value1",
            "key3": "value3",
        },
    }

    result = proxy_config._update_config_fields(
        current_config, "general_settings", db_param_value
    )

    assert result["general_settings"]["max_parallel_requests"] == 10
    assert result["general_settings"]["allowed_models"] == ["gpt-3.5-turbo", "gpt-4"]
    assert result["general_settings"]["new_key"] == "new_value"
    assert result["general_settings"]["nested"]["key1"] == "updated_value1"
    assert result["general_settings"]["nested"]["key2"] == "value2"
    assert result["general_settings"]["nested"]["key3"] == "value3"


@pytest.mark.asyncio
async def test_get_hierarchical_router_settings():
    """
    Test _get_hierarchical_router_settings method's priority order: Key > Team > Global
    """
    from unittest.mock import AsyncMock, MagicMock

    from litellm.proxy._types import UserAPIKeyAuth
    from litellm.proxy.proxy_server import ProxyConfig

    proxy_config = ProxyConfig()

    # Test Case 1: Returns None when prisma_client is None
    result = await proxy_config._get_hierarchical_router_settings(
        user_api_key_dict=None,
        prisma_client=None,
    )
    assert result is None

    # Test Case 2: Returns key-level router_settings when available (as dict)
    mock_user_api_key_dict = MagicMock(spec=UserAPIKeyAuth)
    mock_user_api_key_dict.router_settings = {"routing_strategy": "key-level", "timeout": 10}
    mock_user_api_key_dict.team_id = None

    mock_prisma_client = MagicMock()

    result = await proxy_config._get_hierarchical_router_settings(
        user_api_key_dict=mock_user_api_key_dict,
        prisma_client=mock_prisma_client,
    )
    assert result == {"routing_strategy": "key-level", "timeout": 10}

    # Test Case 3: Returns key-level router_settings when available (as YAML string)
    mock_user_api_key_dict.router_settings = "routing_strategy: key-yaml\ntimeout: 20"
    result = await proxy_config._get_hierarchical_router_settings(
        user_api_key_dict=mock_user_api_key_dict,
        prisma_client=mock_prisma_client,
    )
    assert result == {"routing_strategy": "key-yaml", "timeout": 20}

    # Test Case 4: Falls back to team-level router_settings when key-level is not available
    mock_user_api_key_dict.router_settings = None
    mock_user_api_key_dict.team_id = "team-123"

    mock_team_obj = MagicMock()
    mock_team_obj.router_settings = {"routing_strategy": "team-level", "timeout": 30}

    mock_prisma_client.db.litellm_teamtable.find_unique = AsyncMock(
        return_value=mock_team_obj
    )

    result = await proxy_config._get_hierarchical_router_settings(
        user_api_key_dict=mock_user_api_key_dict,
        prisma_client=mock_prisma_client,
    )
    assert result == {"routing_strategy": "team-level", "timeout": 30}
    mock_prisma_client.db.litellm_teamtable.find_unique.assert_called_once_with(
        where={"team_id": "team-123"}
    )

    # Test Case 5: Falls back to global router_settings when neither key nor team settings are available
    mock_user_api_key_dict.router_settings = None
    mock_prisma_client.db.litellm_teamtable.find_unique = AsyncMock(return_value=None)

    mock_db_config = MagicMock()
    mock_db_config.param_value = {"routing_strategy": "global-level", "timeout": 40}

    mock_prisma_client.db.litellm_config.find_first = AsyncMock(
        return_value=mock_db_config
    )

    result = await proxy_config._get_hierarchical_router_settings(
        user_api_key_dict=mock_user_api_key_dict,
        prisma_client=mock_prisma_client,
    )
    assert result == {"routing_strategy": "global-level", "timeout": 40}
    mock_prisma_client.db.litellm_config.find_first.assert_called_once_with(
        where={"param_name": "router_settings"}
    )

    # Test Case 6: Returns None when no settings are found
    mock_user_api_key_dict.router_settings = None
    mock_prisma_client.db.litellm_teamtable.find_unique = AsyncMock(return_value=None)
    mock_prisma_client.db.litellm_config.find_first = AsyncMock(return_value=None)

    result = await proxy_config._get_hierarchical_router_settings(
        user_api_key_dict=mock_user_api_key_dict,
        prisma_client=mock_prisma_client,
    )
    assert result is None


@pytest.mark.asyncio
async def test_model_info_v2_pagination_basic(monkeypatch):
    """
    Test basic pagination functionality for /v2/model/info endpoint.
    Tests multiple pages with different page sizes.
    """
    from unittest.mock import AsyncMock, MagicMock

    from litellm.proxy._types import UserAPIKeyAuth
    from litellm.proxy.proxy_server import app, proxy_config, user_api_key_auth

    # Create 75 mock models for testing pagination
    mock_models = [
        {
            "model_name": f"model-{i}",
            "litellm_params": {"model": f"gpt-{i}"},
            "model_info": {"id": f"model-{i}"},
        }
        for i in range(1, 76)  # 75 models total
    ]

    # Mock llm_router
    mock_router = MagicMock()
    mock_router.model_list = mock_models

    # Mock prisma_client
    mock_prisma_client = MagicMock()

    # Mock proxy_config.get_config
    mock_get_config = AsyncMock(return_value={})

    # Mock user authentication
    mock_user_api_key_dict = MagicMock(spec=UserAPIKeyAuth)
    mock_user_api_key_dict.user_id = "test-user"
    mock_user_api_key_dict.api_key = "test-key"
    mock_user_api_key_dict.team_models = []
    mock_user_api_key_dict.models = []

    # Apply monkeypatches
    monkeypatch.setattr("litellm.proxy.proxy_server.llm_router", mock_router)
    monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client)
    monkeypatch.setattr("litellm.proxy.proxy_server.user_model", None)
    monkeypatch.setattr(proxy_config, "get_config", mock_get_config)

    # Override auth dependency
    original_overrides = app.dependency_overrides.copy()
    app.dependency_overrides[user_api_key_auth] = lambda: mock_user_api_key_dict

    client = TestClient(app)
    try:
        # Test page 1 with size 25 (should return models 1-25)
        response = client.get("/v2/model/info", params={"page": 1, "size": 25})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 75
        assert data["current_page"] == 1
        assert data["size"] == 25
        assert data["total_pages"] == 3  # ceil(75/25) = 3
        assert len(data["data"]) == 25
        assert data["data"][0]["model_name"] == "model-1"
        assert data["data"][24]["model_name"] == "model-25"

        # Test page 2 with size 25 (should return models 26-50)
        response = client.get("/v2/model/info", params={"page": 2, "size": 25})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 75
        assert data["current_page"] == 2
        assert data["size"] == 25
        assert data["total_pages"] == 3
        assert len(data["data"]) == 25
        assert data["data"][0]["model_name"] == "model-26"
        assert data["data"][24]["model_name"] == "model-50"

        # Test page 3 with size 25 (should return models 51-75)
        response = client.get("/v2/model/info", params={"page": 3, "size": 25})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 75
        assert data["current_page"] == 3
        assert data["size"] == 25
        assert data["total_pages"] == 3
        assert len(data["data"]) == 25
        assert data["data"][0]["model_name"] == "model-51"
        assert data["data"][24]["model_name"] == "model-75"

        # Test different page size (size 10)
        response = client.get("/v2/model/info", params={"page": 1, "size": 10})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 75
        assert data["current_page"] == 1
        assert data["size"] == 10
        assert data["total_pages"] == 8  # ceil(75/10) = 8
        assert len(data["data"]) == 10

    finally:
        app.dependency_overrides = original_overrides


@pytest.mark.asyncio
async def test_model_info_v2_pagination_edge_cases(monkeypatch):
    """
    Test edge cases for pagination in /v2/model/info endpoint.
    Tests empty results, last page with partial results, and boundary conditions.
    """
    from unittest.mock import AsyncMock, MagicMock

    from litellm.proxy._types import UserAPIKeyAuth
    from litellm.proxy.proxy_server import app, proxy_config, user_api_key_auth

    # Mock prisma_client
    mock_prisma_client = MagicMock()

    # Mock user authentication
    mock_user_api_key_dict = MagicMock(spec=UserAPIKeyAuth)
    mock_user_api_key_dict.user_id = "test-user"
    mock_user_api_key_dict.api_key = "test-key"
    mock_user_api_key_dict.team_models = []
    mock_user_api_key_dict.models = []

    # Mock proxy_config.get_config
    mock_get_config = AsyncMock(return_value={})

    # Apply monkeypatches
    monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client)
    monkeypatch.setattr("litellm.proxy.proxy_server.user_model", None)
    monkeypatch.setattr(proxy_config, "get_config", mock_get_config)

    # Override auth dependency
    original_overrides = app.dependency_overrides.copy()
    app.dependency_overrides[user_api_key_auth] = lambda: mock_user_api_key_dict

    client = TestClient(app)
    try:
        # Test Case 1: Empty model list (no models configured)
        mock_router_empty = MagicMock()
        mock_router_empty.model_list = []
        monkeypatch.setattr("litellm.proxy.proxy_server.llm_router", mock_router_empty)

        response = client.get("/v2/model/info", params={"page": 1, "size": 25})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 0
        assert data["current_page"] == 1
        assert data["size"] == 25
        assert data["total_pages"] == 0
        assert len(data["data"]) == 0

        # Test Case 2: Last page with partial results (23 models, page size 10)
        mock_models_partial = [
            {
                "model_name": f"model-{i}",
                "litellm_params": {"model": f"gpt-{i}"},
                "model_info": {"id": f"model-{i}"},
            }
            for i in range(1, 24)  # 23 models total
        ]
        mock_router_partial = MagicMock()
        mock_router_partial.model_list = mock_models_partial
        monkeypatch.setattr("litellm.proxy.proxy_server.llm_router", mock_router_partial)

        # Page 1 should have 10 models
        response = client.get("/v2/model/info", params={"page": 1, "size": 10})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 23
        assert data["current_page"] == 1
        assert data["total_pages"] == 3  # ceil(23/10) = 3
        assert len(data["data"]) == 10

        # Page 2 should have 10 models
        response = client.get("/v2/model/info", params={"page": 2, "size": 10})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 23
        assert data["current_page"] == 2
        assert data["total_pages"] == 3
        assert len(data["data"]) == 10

        # Page 3 (last page) should have only 3 models
        response = client.get("/v2/model/info", params={"page": 3, "size": 10})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 23
        assert data["current_page"] == 3
        assert data["total_pages"] == 3
        assert len(data["data"]) == 3
        assert data["data"][0]["model_name"] == "model-21"
        assert data["data"][2]["model_name"] == "model-23"

        # Test Case 3: Page beyond available pages (should return empty data)
        response = client.get("/v2/model/info", params={"page": 4, "size": 10})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 23
        assert data["current_page"] == 4
        assert data["total_pages"] == 3
        assert len(data["data"]) == 0  # No data for page beyond total_pages

        # Test Case 4: Single model with page size 1
        mock_models_single = [
            {
                "model_name": "single-model",
                "litellm_params": {"model": "gpt-4"},
                "model_info": {"id": "single-model"},
            }
        ]
        mock_router_single = MagicMock()
        mock_router_single.model_list = mock_models_single
        monkeypatch.setattr("litellm.proxy.proxy_server.llm_router", mock_router_single)

        response = client.get("/v2/model/info", params={"page": 1, "size": 1})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 1
        assert data["current_page"] == 1
        assert data["total_pages"] == 1
        assert len(data["data"]) == 1
        assert data["data"][0]["model_name"] == "single-model"

    finally:
        app.dependency_overrides = original_overrides


@pytest.mark.asyncio
async def test_model_info_v2_search_config_models(monkeypatch):
    """
    Test search parameter for config models (models from config.yaml).
    Config models don't have db_model=True in model_info.
    """
    from unittest.mock import AsyncMock, MagicMock

    from litellm.proxy._types import UserAPIKeyAuth
    from litellm.proxy.proxy_server import app, proxy_config, user_api_key_auth

    # Create mock config models (no db_model flag or db_model=False)
    mock_config_models = [
        {
            "model_name": "gpt-4-turbo",
            "litellm_params": {"model": "gpt-4-turbo"},
            "model_info": {"id": "gpt-4-turbo"},  # No db_model flag = config model
        },
        {
            "model_name": "gpt-3.5-turbo",
            "litellm_params": {"model": "gpt-3.5-turbo"},
            "model_info": {"id": "gpt-3.5-turbo", "db_model": False},  # Explicitly config model
        },
        {
            "model_name": "claude-3-opus",
            "litellm_params": {"model": "claude-3-opus"},
            "model_info": {"id": "claude-3-opus"},  # No db_model flag = config model
        },
        {
            "model_name": "gemini-pro",
            "litellm_params": {"model": "gemini-pro"},
            "model_info": {"id": "gemini-pro"},  # No db_model flag = config model
        },
    ]

    # Mock llm_router
    mock_router = MagicMock()
    mock_router.model_list = mock_config_models

    # Mock prisma_client
    mock_prisma_client = MagicMock()

    # Mock proxy_config.get_config
    mock_get_config = AsyncMock(return_value={})

    # Mock user authentication
    mock_user_api_key_dict = MagicMock(spec=UserAPIKeyAuth)
    mock_user_api_key_dict.user_id = "test-user"
    mock_user_api_key_dict.api_key = "test-key"
    mock_user_api_key_dict.team_models = []
    mock_user_api_key_dict.models = []

    # Apply monkeypatches
    monkeypatch.setattr("litellm.proxy.proxy_server.llm_router", mock_router)
    monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client)
    monkeypatch.setattr("litellm.proxy.proxy_server.user_model", None)
    monkeypatch.setattr(proxy_config, "get_config", mock_get_config)

    # Override auth dependency
    original_overrides = app.dependency_overrides.copy()
    app.dependency_overrides[user_api_key_auth] = lambda: mock_user_api_key_dict

    client = TestClient(app)
    try:
        # Test search for "gpt" - should return gpt-4-turbo and gpt-3.5-turbo
        response = client.get("/v2/model/info", params={"search": "gpt"})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 2  # Only config models matching search
        assert len(data["data"]) == 2
        model_names = [m["model_name"] for m in data["data"]]
        assert "gpt-4-turbo" in model_names
        assert "gpt-3.5-turbo" in model_names
        assert "claude-3-opus" not in model_names
        assert "gemini-pro" not in model_names

        # Test search for "claude" - should return claude-3-opus
        response = client.get("/v2/model/info", params={"search": "claude"})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 1
        assert len(data["data"]) == 1
        assert data["data"][0]["model_name"] == "claude-3-opus"

        # Test case-insensitive search
        response = client.get("/v2/model/info", params={"search": "GPT"})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 2
        assert len(data["data"]) == 2

        # Test partial match
        response = client.get("/v2/model/info", params={"search": "turbo"})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 2
        assert len(data["data"]) == 2
        model_names = [m["model_name"] for m in data["data"]]
        assert "gpt-4-turbo" in model_names
        assert "gpt-3.5-turbo" in model_names

        # Test search with no matches
        response = client.get("/v2/model/info", params={"search": "nonexistent"})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 0
        assert len(data["data"]) == 0

    finally:
        app.dependency_overrides = original_overrides


@pytest.mark.asyncio
async def test_model_info_v2_search_db_models(monkeypatch):
    """
    Test search parameter for db models (models from database).
    DB models have db_model=True and id in model_info.
    """
    from unittest.mock import AsyncMock, MagicMock

    from litellm.proxy._types import UserAPIKeyAuth
    from litellm.proxy.proxy_server import app, proxy_config, user_api_key_auth

    # Create mock db models (db_model=True with id)
    mock_db_models_in_router = [
        {
            "model_name": "db-gpt-4",
            "litellm_params": {"model": "gpt-4"},
            "model_info": {"id": "db-model-1", "db_model": True},  # DB model
        },
        {
            "model_name": "db-claude-3",
            "litellm_params": {"model": "claude-3"},
            "model_info": {"id": "db-model-2", "db_model": True},  # DB model
        },
    ]

    # Mock llm_router
    mock_router = MagicMock()
    mock_router.model_list = mock_db_models_in_router

    # Mock prisma_client with database query methods
    mock_db_models_from_db = [
        MagicMock(
            model_id="db-model-3",
            model_name="db-gemini-pro",
            litellm_params='{"model": "gemini-pro"}',
            model_info='{"id": "db-model-3", "db_model": true}',
        ),
        MagicMock(
            model_id="db-model-4",
            model_name="db-gpt-3.5",
            litellm_params='{"model": "gpt-3.5-turbo"}',
            model_info='{"id": "db-model-4", "db_model": true}',
        ),
    ]

    # Mock the database count and find_many methods dynamically based on search
    async def mock_db_count_func(*args, **kwargs):
        where_condition = kwargs.get("where", {})
        search_term = where_condition.get("model_name", {}).get("contains", "")
        excluded_ids = where_condition.get("model_id", {}).get("not", {}).get("in", [])

        # Count models matching search term but not in excluded_ids
        count = 0
        for model in mock_db_models_from_db:
            if search_term.lower() in model.model_name.lower():
                if model.model_id not in excluded_ids:
                    count += 1
        return count

    async def mock_db_find_many_func(*args, **kwargs):
        where_condition = kwargs.get("where", {})
        search_term = where_condition.get("model_name", {}).get("contains", "")
        excluded_ids = where_condition.get("model_id", {}).get("not", {}).get("in", [])
        take = kwargs.get("take", 10)

        # Return models matching search term but not in excluded_ids
        result = []
        for model in mock_db_models_from_db:
            if search_term.lower() in model.model_name.lower():
                if model.model_id not in excluded_ids:
                    result.append(model)
                    if len(result) >= take:
                        break
        return result

    mock_db_count = AsyncMock(side_effect=mock_db_count_func)
    mock_db_find_many = AsyncMock(side_effect=mock_db_find_many_func)

    mock_prisma_client = MagicMock()
    mock_prisma_client.db.litellm_proxymodeltable.count = mock_db_count
    mock_prisma_client.db.litellm_proxymodeltable.find_many = mock_db_find_many

    # Mock proxy_config.decrypt_model_list_from_db to return router-format models
    def mock_decrypt_models(db_models_list):
        result = []
        for db_model in db_models_list:
            result.append(
                {
                    "model_name": db_model.model_name,
                    "litellm_params": {"model": db_model.model_name.replace("db-", "")},
                    "model_info": {"id": db_model.model_id, "db_model": True},
                }
            )
        return result

    # Mock proxy_config.get_config
    mock_get_config = AsyncMock(return_value={})

    # Mock user authentication
    mock_user_api_key_dict = MagicMock(spec=UserAPIKeyAuth)
    mock_user_api_key_dict.user_id = "test-user"
    mock_user_api_key_dict.api_key = "test-key"
    mock_user_api_key_dict.team_models = []
    mock_user_api_key_dict.models = []

    # Apply monkeypatches
    monkeypatch.setattr("litellm.proxy.proxy_server.llm_router", mock_router)
    monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client)
    monkeypatch.setattr("litellm.proxy.proxy_server.user_model", None)
    monkeypatch.setattr(proxy_config, "get_config", mock_get_config)
    monkeypatch.setattr(proxy_config, "decrypt_model_list_from_db", mock_decrypt_models)

    # Override auth dependency
    original_overrides = app.dependency_overrides.copy()
    app.dependency_overrides[user_api_key_auth] = lambda: mock_user_api_key_dict

    client = TestClient(app)
    try:
        # Test search for "gpt" - should return db-gpt-4 from router and db-gpt-3.5 from db
        response = client.get("/v2/model/info", params={"search": "gpt"})
        assert response.status_code == 200
        data = response.json()
        # Should have db-gpt-4 from router + db-gpt-3.5 from db = 2 total
        assert data["total_count"] == 2
        assert len(data["data"]) == 2
        model_names = [m["model_name"] for m in data["data"]]
        assert "db-gpt-4" in model_names
        assert "db-gpt-3.5" in model_names

        # Verify database was queried
        mock_db_count.assert_called()
        # Verify the where condition excludes models already in router
        call_args = mock_db_count.call_args
        assert call_args is not None
        where_condition = call_args[1]["where"]
        assert "model_name" in where_condition
        assert where_condition["model_name"]["contains"] == "gpt"
        assert where_condition["model_name"]["mode"] == "insensitive"

        # Test search for "claude" - should return db-claude-3 from router only
        response = client.get("/v2/model/info", params={"search": "claude"})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 1
        assert len(data["data"]) == 1
        assert data["data"][0]["model_name"] == "db-claude-3"

        # Test search for "gemini" - should return db-gemini-pro from db only
        response = client.get("/v2/model/info", params={"search": "gemini"})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 1
        assert len(data["data"]) == 1
        assert data["data"][0]["model_name"] == "db-gemini-pro"

        # Test case-insensitive search
        response = client.get("/v2/model/info", params={"search": "GPT"})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 2

    finally:
        app.dependency_overrides = original_overrides


@pytest.mark.asyncio
async def test_model_info_v2_filter_by_model_id(monkeypatch):
    """
    Test modelId parameter for filtering by specific model ID.
    Tests that modelId searches in router config first, then database.
    """
    from unittest.mock import AsyncMock, MagicMock

    from litellm.proxy._types import UserAPIKeyAuth
    from litellm.proxy.proxy_server import app, proxy_config, user_api_key_auth

    # Create mock config models
    mock_config_models = [
        {
            "model_name": "gpt-4-turbo",
            "litellm_params": {"model": "gpt-4-turbo"},
            "model_info": {"id": "config-model-1"},
        },
        {
            "model_name": "claude-3-opus",
            "litellm_params": {"model": "claude-3-opus"},
            "model_info": {"id": "config-model-2"},
        },
    ]

    # Mock llm_router with get_model_info method
    mock_router = MagicMock()
    mock_router.model_list = mock_config_models
    mock_router.get_model_info = MagicMock(
        side_effect=lambda id: next(
            (m for m in mock_config_models if m["model_info"]["id"] == id), None
        )
    )

    # Mock prisma_client for database queries
    mock_prisma_client = MagicMock()
    mock_db_table = MagicMock()
    mock_prisma_client.db.litellm_proxymodeltable = mock_db_table

    # Mock database model
    mock_db_model = MagicMock()
    mock_db_model.model_id = "db-model-1"
    mock_db_model.model_name = "db-gpt-3.5"
    mock_db_model.litellm_params = '{"model": "gpt-3.5-turbo"}'
    mock_db_model.model_info = '{"id": "db-model-1", "db_model": true}'

    # Mock find_unique to return db model when searching for db-model-1
    async def mock_find_unique(where):
        if where.get("model_id") == "db-model-1":
            return mock_db_model
        return None

    mock_db_table.find_unique = AsyncMock(side_effect=mock_find_unique)

    # Mock proxy_config.decrypt_model_list_from_db
    def mock_decrypt_models(db_models_list):
        if db_models_list:
            return [
                {
                    "model_name": db_models_list[0].model_name,
                    "litellm_params": {"model": "gpt-3.5-turbo"},
                    "model_info": {"id": db_models_list[0].model_id, "db_model": True},
                }
            ]
        return []

    # Mock proxy_config.get_config
    mock_get_config = AsyncMock(return_value={})

    # Mock user authentication
    mock_user_api_key_dict = MagicMock(spec=UserAPIKeyAuth)
    mock_user_api_key_dict.user_id = "test-user"
    mock_user_api_key_dict.api_key = "test-key"
    mock_user_api_key_dict.team_models = []
    mock_user_api_key_dict.models = []

    # Apply monkeypatches
    monkeypatch.setattr("litellm.proxy.proxy_server.llm_router", mock_router)
    monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client)
    monkeypatch.setattr("litellm.proxy.proxy_server.user_model", None)
    monkeypatch.setattr(proxy_config, "get_config", mock_get_config)
    monkeypatch.setattr(proxy_config, "decrypt_model_list_from_db", mock_decrypt_models)

    # Override auth dependency
    original_overrides = app.dependency_overrides.copy()
    app.dependency_overrides[user_api_key_auth] = lambda: mock_user_api_key_dict

    client = TestClient(app)
    try:
        # Test Case 1: Filter by modelId that exists in config
        response = client.get("/v2/model/info", params={"modelId": "config-model-1"})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 1
        assert len(data["data"]) == 1
        assert data["data"][0]["model_info"]["id"] == "config-model-1"
        assert data["data"][0]["model_name"] == "gpt-4-turbo"
        # Verify router.get_model_info was called
        mock_router.get_model_info.assert_called_with(id="config-model-1")

        # Test Case 2: Filter by modelId that exists in database (not in config)
        response = client.get("/v2/model/info", params={"modelId": "db-model-1"})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 1
        assert len(data["data"]) == 1
        assert data["data"][0]["model_info"]["id"] == "db-model-1"
        assert data["data"][0]["model_name"] == "db-gpt-3.5"
        # Verify database was queried
        mock_db_table.find_unique.assert_called()

        # Test Case 3: Filter by modelId that doesn't exist
        mock_db_table.find_unique = AsyncMock(return_value=None)
        response = client.get("/v2/model/info", params={"modelId": "non-existent-model"})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 0
        assert len(data["data"]) == 0

        # Test Case 4: Filter by modelId with search parameter (should filter further)
        response = client.get(
            "/v2/model/info", params={"modelId": "config-model-1", "search": "claude"}
        )
        assert response.status_code == 200
        data = response.json()
        # config-model-1 is gpt-4-turbo, doesn't match "claude", so should return empty
        assert data["total_count"] == 0
        assert len(data["data"]) == 0

    finally:
        app.dependency_overrides = original_overrides


@pytest.mark.asyncio
async def test_model_info_v2_filter_by_team_id(monkeypatch):
    """
    Test teamId parameter for filtering models by team ID.
    Tests that teamId filters models based on direct_access or access_via_team_ids.
    """
    from unittest.mock import AsyncMock, MagicMock

    from litellm.proxy._types import LiteLLM_TeamTable, UserAPIKeyAuth
    from litellm.proxy.proxy_server import app, proxy_config, user_api_key_auth

    # Create mock models with different access configurations
    mock_models = [
        {
            "model_name": "model-direct-access",
            "litellm_params": {"model": "gpt-4"},
            "model_info": {
                "id": "model-1",
                "direct_access": True,  # Should be included
            },
        },
        {
            "model_name": "model-team-access",
            "litellm_params": {"model": "claude-3"},
            "model_info": {
                "id": "model-2",
                "direct_access": False,
                "access_via_team_ids": ["team-123"],  # Should be included
            },
        },
        {
            "model_name": "model-no-access",
            "litellm_params": {"model": "gemini-pro"},
            "model_info": {
                "id": "model-3",
                "direct_access": False,
                "access_via_team_ids": ["team-456"],  # Should NOT be included
            },
        },
        {
            "model_name": "model-multiple-teams",
            "litellm_params": {"model": "gpt-3.5"},
            "model_info": {
                "id": "model-4",
                "direct_access": False,
                "access_via_team_ids": ["team-789", "team-123"],  # Should be included
            },
        },
    ]

    # Mock llm_router
    mock_router = MagicMock()
    mock_router.model_list = mock_models

    # Mock get_model_list to return models based on model_name filter
    def mock_get_model_list(model_name=None, team_id=None):
        if model_name:
            return [m for m in mock_models if m["model_name"] == model_name]
        return mock_models

    mock_router.get_model_list = MagicMock(side_effect=mock_get_model_list)

    # Mock team database object - team has access to specific models
    mock_team_db_object = MagicMock()
    mock_team_db_object.model_dump.return_value = {
        "team_id": "team-123",
        "models": ["model-direct-access", "model-team-access", "model-multiple-teams"],  # Specific models
    }

    # Mock prisma_client
    mock_prisma_client = MagicMock()
    mock_team_table = MagicMock()
    mock_prisma_client.db.litellm_teamtable = mock_team_table
    mock_team_table.find_unique = AsyncMock(return_value=mock_team_db_object)

    # Mock LiteLLM_TeamTable - team has access to specific models
    mock_team_object = LiteLLM_TeamTable(
        team_id="team-123",
        models=["model-direct-access", "model-team-access", "model-multiple-teams"],
    )

    # Mock proxy_config.get_config
    mock_get_config = AsyncMock(return_value={})

    # Mock user authentication
    mock_user_api_key_dict = MagicMock(spec=UserAPIKeyAuth)
    mock_user_api_key_dict.user_id = "test-user"
    mock_user_api_key_dict.api_key = "test-key"
    mock_user_api_key_dict.team_models = []
    mock_user_api_key_dict.models = []

    # Apply monkeypatches
    monkeypatch.setattr("litellm.proxy.proxy_server.llm_router", mock_router)
    monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client)
    monkeypatch.setattr("litellm.proxy.proxy_server.user_model", None)
    monkeypatch.setattr(proxy_config, "get_config", mock_get_config)
    # Mock LiteLLM_TeamTable instantiation
    monkeypatch.setattr(
        "litellm.proxy.proxy_server.LiteLLM_TeamTable",
        lambda **kwargs: mock_team_object,
    )

    # Override auth dependency
    original_overrides = app.dependency_overrides.copy()
    app.dependency_overrides[user_api_key_auth] = lambda: mock_user_api_key_dict

    client = TestClient(app)
    try:
        # Test Case 1: Filter by teamId - should return models with direct_access=True or team-123 in access_via_team_ids
        response = client.get("/v2/model/info", params={"teamId": "team-123"})
        assert response.status_code == 200
        data = response.json()
        # Should include: model-1 (direct_access), model-2 (team-123 in access_via_team_ids), model-4 (team-123 in access_via_team_ids)
        # Should NOT include: model-3 (team-456 only)
        assert data["total_count"] == 3
        assert len(data["data"]) == 3
        model_ids = [m["model_info"]["id"] for m in data["data"]]
        assert "model-1" in model_ids  # direct_access
        assert "model-2" in model_ids  # team-123 in access_via_team_ids
        assert "model-4" in model_ids  # team-123 in access_via_team_ids
        assert "model-3" not in model_ids  # Should be excluded

        # Test Case 2: Filter by teamId that doesn't exist - should return empty list
        mock_team_table.find_unique = AsyncMock(return_value=None)
        response = client.get("/v2/model/info", params={"teamId": "non-existent-team"})
        assert response.status_code == 200
        data = response.json()
        assert data["total_count"] == 0
        assert len(data["data"]) == 0

        # Test Case 3: Filter by different teamId - should only return models with that team in access_via_team_ids
        mock_team_db_object_456 = MagicMock()
        mock_team_db_object_456.model_dump.return_value = {
            "team_id": "team-456",
            "models": ["model-no-access"],  # Team has access to model-no-access
        }
        mock_team_table.find_unique = AsyncMock(return_value=mock_team_db_object_456)
        mock_team_object_456 = LiteLLM_TeamTable(
            team_id="team-456",
            models=["model-no-access"],
        )
        monkeypatch.setattr(
            "litellm.proxy.proxy_server.LiteLLM_TeamTable",
            lambda **kwargs: mock_team_object_456,
        )

        response = client.get("/v2/model/info", params={"teamId": "team-456"})
        assert response.status_code == 200
        data = response.json()
        # Should include: model-1 (direct_access), model-3 (team-456 in access_via_team_ids)
        # Should NOT include: model-2 (team-123 only), model-4 (team-789 and team-123, but not team-456)
        assert data["total_count"] >= 2
        model_ids = [m["model_info"]["id"] for m in data["data"]]
        assert "model-1" in model_ids  # direct_access
        assert "model-3" in model_ids  # team-456 in access_via_team_ids

    finally:
        app.dependency_overrides = original_overrides


@pytest.mark.asyncio
@pytest.mark.parametrize(
    "sort_by,sort_order,expected_order",
    [
        # Test model_name sorting
        ("model_name", "asc", ["a-model", "b-model", "z-model"]),
        ("model_name", "desc", ["z-model", "b-model", "a-model"]),
        # Test created_at sorting
        ("created_at", "asc", ["old-model", "mid-model", "new-model"]),
        ("created_at", "desc", ["new-model", "mid-model", "old-model"]),
        # Test updated_at sorting
        ("updated_at", "asc", ["old-updated", "mid-updated", "new-updated"]),
        ("updated_at", "desc", ["new-updated", "mid-updated", "old-updated"]),
        # Test costs sorting
        ("costs", "asc", ["low-cost", "mid-cost", "high-cost"]),
        ("costs", "desc", ["high-cost", "mid-cost", "low-cost"]),
        # Test status sorting (False/config models come before True/db models in asc)
        ("status", "asc", ["config-model-1", "config-model-2", "db-model"]),
        ("status", "desc", ["db-model", "config-model-1", "config-model-2"]),
    ],
)
async def test_model_info_v2_sorting(monkeypatch, sort_by, sort_order, expected_order):
    """
    Test sorting functionality for /v2/model/info endpoint.
    Tests all sortBy fields (model_name, created_at, updated_at, costs, status)
    with both asc and desc sort orders.
    """
    from datetime import datetime, timedelta
    from unittest.mock import AsyncMock, MagicMock

    from litellm.proxy._types import UserAPIKeyAuth
    from litellm.proxy.proxy_server import app, proxy_config, user_api_key_auth

    # Create base time for date comparisons
    base_time = datetime(2024, 1, 1, 12, 0, 0)

    # Create mock models with different values for each sort field
    mock_models = []

    if sort_by == "model_name":
        # Models with different names
        mock_models = [
            {
                "model_name": "z-model",
                "litellm_params": {"model": "z-model"},
                "model_info": {"id": "z-model"},
            },
            {
                "model_name": "a-model",
                "litellm_params": {"model": "a-model"},
                "model_info": {"id": "a-model"},
            },
            {
                "model_name": "b-model",
                "litellm_params": {"model": "b-model"},
                "model_info": {"id": "b-model"},
            },
        ]
    elif sort_by == "created_at":
        # Models with different created_at timestamps
        mock_models = [
            {
                "model_name": "new-model",
                "litellm_params": {"model": "new-model"},
                "model_info": {
                    "id": "new-model",
                    "created_at": (base_time + timedelta(days=3)).isoformat(),
                },
            },
            {
                "model_name": "old-model",
                "litellm_params": {"model": "old-model"},
                "model_info": {
                    "id": "old-model",
                    "created_at": (base_time - timedelta(days=3)).isoformat(),
                },
            },
            {
                "model_name": "mid-model",
                "litellm_params": {"model": "mid-model"},
                "model_info": {
                    "id": "mid-model",
                    "created_at": base_time.isoformat(),
                },
            },
        ]
    elif sort_by == "updated_at":
        # Models with different updated_at timestamps
        mock_models = [
            {
                "model_name": "new-updated",
                "litellm_params": {"model": "new-updated"},
                "model_info": {
                    "id": "new-updated",
                    "updated_at": (base_time + timedelta(days=3)).isoformat(),
                },
            },
            {
                "model_name": "old-updated",
                "litellm_params": {"model": "old-updated"},
                "model_info": {
                    "id": "old-updated",
                    "updated_at": (base_time - timedelta(days=3)).isoformat(),
                },
            },
            {
                "model_name": "mid-updated",
                "litellm_params": {"model": "mid-updated"},
                "model_info": {
                    "id": "mid-updated",
                    "updated_at": base_time.isoformat(),
                },
            },
        ]
    elif sort_by == "costs":
        # Models with different costs (input_cost + output_cost)
        mock_models = [
            {
                "model_name": "high-cost",
                "litellm_params": {"model": "high-cost"},
                "model_info": {
                    "id": "high-cost",
                    "input_cost_per_token": 0.00005,
                    "output_cost_per_token": 0.00015,
                },
            },
            {
                "model_name": "low-cost",
                "litellm_params": {"model": "low-cost"},
                "model_info": {
                    "id": "low-cost",
                    "input_cost_per_token": 0.00001,
                    "output_cost_per_token": 0.00003,
                },
            },
            {
                "model_name": "mid-cost",
                "litellm_params": {"model": "mid-cost"},
                "model_info": {
                    "id": "mid-cost",
                    "input_cost_per_token": 0.00003,
                    "output_cost_per_token": 0.00007,
                },
            },
        ]
    elif sort_by == "status":
        # Models with different db_model status (False = config, True = db)
        mock_models = [
            {
                "model_name": "db-model",
                "litellm_params": {"model": "db-model"},
                "model_info": {"id": "db-model", "db_model": True},
            },
            {
                "model_name": "config-model-1",
                "litellm_params": {"model": "config-model-1"},
                "model_info": {"id": "config-model-1", "db_model": False},
            },
            {
                "model_name": "config-model-2",
                "litellm_params": {"model": "config-model-2"},
                "model_info": {"id": "config-model-2", "db_model": False},
            },
        ]

    # Mock llm_router
    mock_router = MagicMock()
    mock_router.model_list = mock_models

    # Mock prisma_client
    mock_prisma_client = MagicMock()

    # Mock proxy_config.get_config
    mock_get_config = AsyncMock(return_value={})

    # Mock user authentication
    mock_user_api_key_dict = MagicMock(spec=UserAPIKeyAuth)
    mock_user_api_key_dict.user_id = "test-user"
    mock_user_api_key_dict.api_key = "test-key"
    mock_user_api_key_dict.team_models = []
    mock_user_api_key_dict.models = []

    # Apply monkeypatches
    monkeypatch.setattr("litellm.proxy.proxy_server.llm_router", mock_router)
    monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client)
    monkeypatch.setattr("litellm.proxy.proxy_server.user_model", None)
    monkeypatch.setattr(proxy_config, "get_config", mock_get_config)

    # Override auth dependency
    original_overrides = app.dependency_overrides.copy()
    app.dependency_overrides[user_api_key_auth] = lambda: mock_user_api_key_dict

    client = TestClient(app)
    try:
        # Test sorting with specified sortBy and sortOrder
        response = client.get(
            "/v2/model/info", params={"sortBy": sort_by, "sortOrder": sort_order}
        )
        assert response.status_code == 200
        data = response.json()
        assert len(data["data"]) == len(expected_order)

        # Verify models are in expected order
        actual_order = [m["model_name"] for m in data["data"]]
        assert actual_order == expected_order, (
            f"Sorting failed for sortBy={sort_by}, sortOrder={sort_order}. "
            f"Expected: {expected_order}, Got: {actual_order}"
        )

    finally:
        app.dependency_overrides = original_overrides


@pytest.mark.asyncio
async def test_model_info_v2_sorting_invalid_sort_order(monkeypatch):
    """
    Test that invalid sortOrder values return a 400 error.
    """
    from unittest.mock import AsyncMock, MagicMock

    from litellm.proxy._types import UserAPIKeyAuth
    from litellm.proxy.proxy_server import app, proxy_config, user_api_key_auth

    # Create mock models
    mock_models = [
        {
            "model_name": "test-model",
            "litellm_params": {"model": "test-model"},
            "model_info": {"id": "test-model"},
        }
    ]

    # Mock llm_router
    mock_router = MagicMock()
    mock_router.model_list = mock_models

    # Mock prisma_client
    mock_prisma_client = MagicMock()

    # Mock proxy_config.get_config
    mock_get_config = AsyncMock(return_value={})

    # Mock user authentication
    mock_user_api_key_dict = MagicMock(spec=UserAPIKeyAuth)
    mock_user_api_key_dict.user_id = "test-user"
    mock_user_api_key_dict.api_key = "test-key"
    mock_user_api_key_dict.team_models = []
    mock_user_api_key_dict.models = []

    # Apply monkeypatches
    monkeypatch.setattr("litellm.proxy.proxy_server.llm_router", mock_router)
    monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client)
    monkeypatch.setattr("litellm.proxy.proxy_server.user_model", None)
    monkeypatch.setattr(proxy_config, "get_config", mock_get_config)

    # Override auth dependency
    original_overrides = app.dependency_overrides.copy()
    app.dependency_overrides[user_api_key_auth] = lambda: mock_user_api_key_dict

    client = TestClient(app)
    try:
        # Test invalid sortOrder
        response = client.get(
            "/v2/model/info", params={"sortBy": "model_name", "sortOrder": "invalid"}
        )
        assert response.status_code == 400
        data = response.json()
        assert "Invalid sortOrder" in data["detail"]

    finally:
        app.dependency_overrides = original_overrides


@pytest.mark.asyncio
async def test_apply_search_filter_to_models(monkeypatch):
    """
    Test the _apply_search_filter_to_models helper function.
    Tests search filtering logic for config models, db models, and database queries.
    """
    from unittest.mock import AsyncMock, MagicMock

    from litellm.proxy.proxy_server import _apply_search_filter_to_models, proxy_config

    # Create mock models with mix of config and db models
    mock_models = [
        {
            "model_name": "gpt-4-turbo",
            "model_info": {"id": "gpt-4-turbo"},  # Config model
        },
        {
            "model_name": "db-gpt-3.5",
            "model_info": {"id": "db-model-1", "db_model": True},  # DB model in router
        },
        {
            "model_name": "claude-3-opus",
            "model_info": {"id": "claude-3-opus"},  # Config model
        },
    ]

    # Mock prisma_client
    mock_prisma_client = MagicMock()
    mock_db_table = MagicMock()
    mock_prisma_client.db.litellm_proxymodeltable = mock_db_table

    # Mock database models
    mock_db_model_1 = MagicMock(
        model_id="db-model-2",
        model_name="db-gemini-pro",
        litellm_params='{"model": "gemini-pro"}',
        model_info='{"id": "db-model-2", "db_model": true}',
    )

    # Mock proxy_config.decrypt_model_list_from_db
    mock_decrypt = MagicMock(return_value=[{"model_name": "db-gemini-pro", "model_info": {"id": "db-model-2", "db_model": True}}])

    monkeypatch.setattr(proxy_config, "decrypt_model_list_from_db", mock_decrypt)

    # Test Case 1: No search term - should return all models unchanged
    result_models, total_count = await _apply_search_filter_to_models(
        all_models=mock_models.copy(),
        search="",
        page=1,
        size=50,
        prisma_client=mock_prisma_client,
        proxy_config=proxy_config,
    )
    assert result_models == mock_models
    assert total_count is None

    # Test Case 2: Search for "gpt" - should filter router models and query DB
    mock_db_table.count = AsyncMock(return_value=0)
    mock_db_table.find_many = AsyncMock(return_value=[])

    result_models, total_count = await _apply_search_filter_to_models(
        all_models=mock_models.copy(),
        search="gpt",
        page=1,
        size=50,
        prisma_client=mock_prisma_client,
        proxy_config=proxy_config,
    )
    assert len(result_models) == 2
    model_names = [m["model_name"] for m in result_models]
    assert "gpt-4-turbo" in model_names
    assert "db-gpt-3.5" in model_names
    assert "claude-3-opus" not in model_names
    assert total_count == 2  # Only router models match

    # Test Case 3: Search with DB models matching
    mock_db_table.count = AsyncMock(return_value=1)
    mock_db_table.find_many = AsyncMock(return_value=[mock_db_model_1])

    result_models, total_count = await _apply_search_filter_to_models(
        all_models=mock_models.copy(),
        search="gemini",
        page=1,
        size=50,
        prisma_client=mock_prisma_client,
        proxy_config=proxy_config,
    )
    assert total_count == 1  # Router models (0) + DB models (1)
    assert len(result_models) == 1
    assert result_models[0]["model_name"] == "db-gemini-pro"

    # Test Case 4: Case-insensitive search
    # Reset mocks - no DB models should match "GPT"
    mock_db_table.count = AsyncMock(return_value=0)
    mock_db_table.find_many = AsyncMock(return_value=[])

    result_models, total_count = await _apply_search_filter_to_models(
        all_models=mock_models.copy(),
        search="GPT",
        page=1,
        size=50,
        prisma_client=mock_prisma_client,
        proxy_config=proxy_config,
    )
    assert len(result_models) == 2
    model_names = [m["model_name"] for m in result_models]
    assert "gpt-4-turbo" in model_names
    assert "db-gpt-3.5" in model_names

    # Test Case 5: Database query error - should fallback to router models count
    mock_db_table.count = AsyncMock(side_effect=Exception("DB error"))
    mock_db_table.find_many = AsyncMock(return_value=[])

    result_models, total_count = await _apply_search_filter_to_models(
        all_models=mock_models.copy(),
        search="gpt",
        page=1,
        size=50,
        prisma_client=mock_prisma_client,
        proxy_config=proxy_config,
    )
    # Should still return filtered router models
    assert len(result_models) == 2
    assert total_count == 2  # Fallback to router models count


def test_paginate_models_response():
    """
    Test the _paginate_models_response helper function.
    Tests pagination calculation and response formatting.
    """
    from litellm.proxy.proxy_server import _paginate_models_response

    # Create mock models
    mock_models = [
        {"model_name": f"model-{i}", "model_info": {"id": f"model-{i}"}}
        for i in range(25)
    ]

    # Test Case 1: Basic pagination - first page
    result = _paginate_models_response(
        all_models=mock_models,
        page=1,
        size=10,
        total_count=None,
        search=None,
    )
    assert result["total_count"] == 25
    assert result["current_page"] == 1
    assert result["total_pages"] == 3  # ceil(25/10) = 3
    assert result["size"] == 10
    assert len(result["data"]) == 10
    assert result["data"][0]["model_name"] == "model-0"

    # Test Case 2: Second page
    result = _paginate_models_response(
        all_models=mock_models,
        page=2,
        size=10,
        total_count=None,
        search=None,
    )
    assert result["current_page"] == 2
    assert len(result["data"]) == 10
    assert result["data"][0]["model_name"] == "model-10"

    # Test Case 3: Last page (partial)
    result = _paginate_models_response(
        all_models=mock_models,
        page=3,
        size=10,
        total_count=None,
        search=None,
    )
    assert result["current_page"] == 3
    assert len(result["data"]) == 5  # Only 5 models left
    assert result["data"][0]["model_name"] == "model-20"

    # Test Case 4: With explicit total_count (for search scenarios)
    result = _paginate_models_response(
        all_models=mock_models[:10],  # Only 10 models in list
        page=1,
        size=10,
        total_count=50,  # But total_count says 50
        search="test",
    )
    assert result["total_count"] == 50
    assert result["total_pages"] == 5  # ceil(50/10) = 5
    assert len(result["data"]) == 10

    # Test Case 5: Empty models list
    result = _paginate_models_response(
        all_models=[],
        page=1,
        size=10,
        total_count=0,
        search=None,
    )
    assert result["total_count"] == 0
    assert result["total_pages"] == 0
    assert len(result["data"]) == 0

    # Test Case 6: Page beyond available data
    result = _paginate_models_response(
        all_models=mock_models[:10],
        page=5,
        size=10,
        total_count=10,
        search=None,
    )
    assert result["current_page"] == 5
    assert len(result["data"]) == 0  # No data for page 5


def test_enrich_model_info_with_litellm_data():
    """
    Test the _enrich_model_info_with_litellm_data helper function.
    Tests model info enrichment, debug mode, and sensitive info removal.
    """
    from unittest.mock import MagicMock, patch

    from litellm.proxy.proxy_server import _enrich_model_info_with_litellm_data

    # Test Case 1: Basic model enrichment without debug
    model = {
        "model_name": "test-model",
        "litellm_params": {"model": "gpt-3.5-turbo"},
        "model_info": {"id": "test-model"},
        "api_key": "sk-secret-key",  # Should be removed
    }

    with patch("litellm.proxy.proxy_server.get_litellm_model_info") as mock_get_info, patch(
        "litellm.proxy.proxy_server.remove_sensitive_info_from_deployment"
    ) as mock_remove_sensitive:
        mock_get_info.return_value = {
            "input_cost_per_token": 0.001,
            "output_cost_per_token": 0.002,
            "max_tokens": 4096,
        }
        mock_remove_sensitive.return_value = {
            "model_name": "test-model",
            "litellm_params": {"model": "gpt-3.5-turbo"},
            "model_info": {
                "id": "test-model",
                "input_cost_per_token": 0.001,
                "output_cost_per_token": 0.002,
                "max_tokens": 4096,
            },
        }

        result = _enrich_model_info_with_litellm_data(model=model, debug=False)

        # Verify get_litellm_model_info was called
        mock_get_info.assert_called_once_with(model=model)
        # Verify remove_sensitive_info_from_deployment was called
        mock_remove_sensitive.assert_called_once()
        # Verify result doesn't have api_key
        assert "api_key" not in result
        # Verify model_info was enriched
        assert "input_cost_per_token" in result["model_info"]

    # Test Case 2: Model enrichment with debug mode
    model_with_debug = {
        "model_name": "test-model-debug",
        "litellm_params": {"model": "gpt-4"},
        "model_info": {},
    }

    mock_router = MagicMock()
    mock_client = MagicMock()
    mock_router._get_client.return_value = mock_client

    with patch("litellm.proxy.proxy_server.get_litellm_model_info") as mock_get_info, patch(
        "litellm.proxy.proxy_server.remove_sensitive_info_from_deployment"
    ) as mock_remove_sensitive:
        mock_get_info.return_value = {}
        mock_remove_sensitive.return_value = {
            "model_name": "test-model-debug",
            "litellm_params": {"model": "gpt-4"},
            "model_info": {},
            "openai_client": str(mock_client),
        }

        result = _enrich_model_info_with_litellm_data(
            model=model_with_debug, debug=True, llm_router=mock_router
        )

        # Verify debug info was added
        mock_remove_sensitive.assert_called_once()
        call_args = mock_remove_sensitive.call_args[0][0]
        assert "openai_client" in call_args
        # Verify router._get_client was called for debug
        mock_router._get_client.assert_called_once()

    # Test Case 3: Model with fallback to litellm.get_model_info
    model_fallback = {
        "model_name": "test-model-fallback",
        "litellm_params": {"model": "claude-3-opus"},
        "model_info": {},
    }

    with patch("litellm.proxy.proxy_server.get_litellm_model_info") as mock_get_info, patch(
        "litellm.get_model_info"
    ) as mock_litellm_info, patch(
        "litellm.proxy.proxy_server.remove_sensitive_info_from_deployment"
    ) as mock_remove_sensitive:
        # First call returns empty, triggering fallback
        mock_get_info.return_value = {}
        mock_litellm_info.return_value = {
            "input_cost_per_token": 0.015,
            "output_cost_per_token": 0.075,
            "max_tokens": 200000,
        }
        mock_remove_sensitive.return_value = {
            "model_name": "test-model-fallback",
            "litellm_params": {"model": "claude-3-opus"},
            "model_info": {
                "input_cost_per_token": 0.015,
                "output_cost_per_token": 0.075,
                "max_tokens": 200000,
            },
        }

        result = _enrich_model_info_with_litellm_data(model=model_fallback, debug=False)

        # Verify fallback was attempted
        mock_litellm_info.assert_called_once_with(model="claude-3-opus")
        # Verify model_info was enriched with fallback data
        call_args = mock_remove_sensitive.call_args[0][0]
        assert call_args["model_info"]["input_cost_per_token"] == 0.015

    # Test Case 4: Model with split model name fallback
    model_split = {
        "model_name": "test-model-split",
        "litellm_params": {"model": "azure/gpt-4"},
        "model_info": {},
    }

    with patch("litellm.proxy.proxy_server.get_litellm_model_info") as mock_get_info, patch(
        "litellm.get_model_info"
    ) as mock_litellm_info, patch(
        "litellm.proxy.proxy_server.remove_sensitive_info_from_deployment"
    ) as mock_remove_sensitive:
        # Both first and second pass return empty, triggering third pass
        mock_get_info.return_value = {}
        # Second pass (no split)
        mock_litellm_info.side_effect = [
            {},  # First call returns empty
            {"max_tokens": 8192},  # Third pass with split succeeds
        ]
        mock_remove_sensitive.return_value = {
            "model_name": "test-model-split",
            "litellm_params": {"model": "azure/gpt-4"},
            "model_info": {"max_tokens": 8192},
        }

        result = _enrich_model_info_with_litellm_data(model=model_split, debug=False)

        # Verify third pass was attempted with split model name
        assert mock_litellm_info.call_count == 2
        # Check that second call used split model name
        second_call = mock_litellm_info.call_args_list[1]
        assert second_call[1]["model"] == "gpt-4"
        assert second_call[1]["custom_llm_provider"] == "azure"

    # Test Case 5: Model with existing model_info (should preserve existing keys)
    model_existing = {
        "model_name": "test-model-existing",
        "litellm_params": {"model": "gpt-3.5-turbo"},
        "model_info": {"id": "existing-id", "custom_key": "custom_value"},
    }

    with patch("litellm.proxy.proxy_server.get_litellm_model_info") as mock_get_info, patch(
        "litellm.proxy.proxy_server.remove_sensitive_info_from_deployment"
    ) as mock_remove_sensitive:
        mock_get_info.return_value = {
            "input_cost_per_token": 0.001,
            "id": "new-id",  # Should not override existing "id"
        }
        mock_remove_sensitive.return_value = {
            "model_name": "test-model-existing",
            "litellm_params": {"model": "gpt-3.5-turbo"},
            "model_info": {
                "id": "existing-id",  # Existing key preserved
                "custom_key": "custom_value",  # Existing key preserved
                "input_cost_per_token": 0.001,  # New key added
            },
        }

        result = _enrich_model_info_with_litellm_data(model=model_existing, debug=False)

        # Verify existing keys are preserved
        call_args = mock_remove_sensitive.call_args[0][0]
        assert call_args["model_info"]["id"] == "existing-id"
        assert call_args["model_info"]["custom_key"] == "custom_value"
        assert call_args["model_info"]["input_cost_per_token"] == 0.001


@pytest.mark.asyncio
async def test_model_list_scope_parameter_validation(monkeypatch):
    """Test that invalid scope parameter raises HTTPException"""
    from fastapi import HTTPException

    from litellm.proxy._types import LitellmUserRoles, UserAPIKeyAuth
    from litellm.proxy.proxy_server import model_list

    mock_user_api_key_dict = UserAPIKeyAuth(
        user_id="test-user",
        user_role=LitellmUserRoles.INTERNAL_USER,
        api_key="test-key",
    )

    # Test invalid scope parameter
    with pytest.raises(HTTPException) as exc_info:
        await model_list(
            user_api_key_dict=mock_user_api_key_dict,
            scope="invalid_scope",
        )

    assert exc_info.value.status_code == 400
    assert "Invalid scope parameter" in exc_info.value.detail
    assert "Only 'expand' is currently supported" in exc_info.value.detail


@pytest.mark.asyncio
async def test_model_list_scope_expand_proxy_admin(monkeypatch):
    """Test that proxy admin with scope=expand returns all proxy models"""
    from litellm.proxy._types import LiteLLM_UserTable, LitellmUserRoles, UserAPIKeyAuth
    from litellm.proxy.proxy_server import model_list

    # Mock user API key dict for proxy admin
    mock_user_api_key_dict = UserAPIKeyAuth(
        user_id="proxy-admin-user",
        user_role=LitellmUserRoles.PROXY_ADMIN,
        api_key="test-key",
    )

    # Mock llm_router with proxy models
    mock_router = MagicMock()
    mock_router.get_model_names.return_value = ["gpt-4", "gpt-3.5-turbo", "claude-3-opus"]
    mock_router.get_model_access_groups.return_value = {}

    # Mock prisma_client
    mock_prisma_client = MagicMock()

    # Mock user_api_key_cache
    mock_user_api_key_cache = MagicMock()

    # Mock proxy_logging_obj
    mock_proxy_logging_obj = MagicMock()

    # Mock get_complete_model_list
    mock_all_models = ["gpt-4", "gpt-3.5-turbo", "claude-3-opus"]

    # Mock create_model_info_response
    def mock_create_model_info_response(model_id, provider, include_metadata=False, fallback_type=None, llm_router=None):
        return {"id": model_id, "object": "model"}

    # Apply monkeypatches
    monkeypatch.setattr("litellm.proxy.proxy_server.llm_router", mock_router)
    monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client)
    monkeypatch.setattr("litellm.proxy.proxy_server.user_api_key_cache", mock_user_api_key_cache)
    monkeypatch.setattr("litellm.proxy.proxy_server.proxy_logging_obj", mock_proxy_logging_obj)
    monkeypatch.setattr("litellm.proxy.proxy_server.general_settings", {})
    monkeypatch.setattr("litellm.proxy.proxy_server.user_model", None)
    monkeypatch.setattr(
        "litellm.proxy.auth.model_checks.get_complete_model_list",
        lambda **kwargs: mock_all_models,
    )
    monkeypatch.setattr(
        "litellm.proxy.utils.create_model_info_response",
        mock_create_model_info_response,
    )

    # Call model_list with scope=expand
    result = await model_list(
        user_api_key_dict=mock_user_api_key_dict,
        scope="expand",
    )

    # Verify result contains all proxy models
    assert result["object"] == "list"
    assert len(result["data"]) == 3
    assert all(model["id"] in mock_all_models for model in result["data"])

    # Verify router methods were called
    mock_router.get_model_names.assert_called_once()
    mock_router.get_model_access_groups.assert_called_once()


@pytest.mark.asyncio
async def test_model_list_scope_expand_org_admin(monkeypatch):
    """Test that org admin with scope=expand returns all proxy models"""
    from litellm.proxy._types import (
        LiteLLM_UserTable,
        LitellmUserRoles,
        UserAPIKeyAuth,
    )
    from litellm.proxy.proxy_server import model_list

    # Mock user API key dict for org admin
    mock_user_api_key_dict = UserAPIKeyAuth(
        user_id="org-admin-user",
        user_role=LitellmUserRoles.INTERNAL_USER,  # Not proxy admin, but org admin
        api_key="test-key",
    )

    # Mock user object with org admin membership
    from datetime import datetime

    from litellm.proxy._types import LiteLLM_OrganizationMembershipTable

    mock_user_obj = LiteLLM_UserTable(
        user_id="org-admin-user",
        user_email="org-admin@example.com",
        organization_memberships=[
            LiteLLM_OrganizationMembershipTable(
                user_id="org-admin-user",
                organization_id="org-123",
                user_role=LitellmUserRoles.ORG_ADMIN.value,
                spend=0.0,
                created_at=datetime.now(),
                updated_at=datetime.now(),
            )
        ],
        teams=[],
    )

    # Mock llm_router with proxy models
    mock_router = MagicMock()
    mock_router.get_model_names.return_value = ["gpt-4", "gpt-3.5-turbo", "claude-3-opus"]
    mock_router.get_model_access_groups.return_value = {}

    # Mock prisma_client
    mock_prisma_client = MagicMock()

    # Mock user_api_key_cache
    mock_user_api_key_cache = MagicMock()

    # Mock proxy_logging_obj
    mock_proxy_logging_obj = MagicMock()

    # Mock get_user_object to return user with org admin role
    async def mock_get_user_object(*args, **kwargs):
        return mock_user_obj

    # Mock get_complete_model_list
    mock_all_models = ["gpt-4", "gpt-3.5-turbo", "claude-3-opus"]

    # Mock create_model_info_response
    def mock_create_model_info_response(model_id, provider, include_metadata=False, fallback_type=None, llm_router=None):
        return {"id": model_id, "object": "model"}

    # Apply monkeypatches
    monkeypatch.setattr("litellm.proxy.proxy_server.llm_router", mock_router)
    monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client)
    monkeypatch.setattr("litellm.proxy.proxy_server.user_api_key_cache", mock_user_api_key_cache)
    monkeypatch.setattr("litellm.proxy.proxy_server.proxy_logging_obj", mock_proxy_logging_obj)
    monkeypatch.setattr("litellm.proxy.proxy_server.general_settings", {})
    monkeypatch.setattr("litellm.proxy.proxy_server.user_model", None)
    monkeypatch.setattr(
        "litellm.proxy.auth.auth_checks.get_user_object",
        mock_get_user_object,
    )
    monkeypatch.setattr(
        "litellm.proxy.auth.model_checks.get_complete_model_list",
        lambda **kwargs: mock_all_models,
    )
    monkeypatch.setattr(
        "litellm.proxy.utils.create_model_info_response",
        mock_create_model_info_response,
    )

    # Call model_list with scope=expand
    result = await model_list(
        user_api_key_dict=mock_user_api_key_dict,
        scope="expand",
    )

    # Verify result contains all proxy models
    assert result["object"] == "list"
    assert len(result["data"]) == 3
    assert all(model["id"] in mock_all_models for model in result["data"])

    # Verify router methods were called
    mock_router.get_model_names.assert_called_once()
    mock_router.get_model_access_groups.assert_called_once()


@pytest.mark.asyncio
async def test_model_list_scope_expand_team_admin(monkeypatch):
    """Test that team admin with scope=expand returns all proxy models"""
    from litellm.proxy._types import (
        LiteLLM_TeamTable,
        LiteLLM_UserTable,
        LitellmUserRoles,
        UserAPIKeyAuth,
    )
    from litellm.proxy.proxy_server import model_list

    # Mock user API key dict for team admin
    mock_user_api_key_dict = UserAPIKeyAuth(
        user_id="team-admin-user",
        user_role=LitellmUserRoles.INTERNAL_USER,  # Not proxy admin, but team admin
        api_key="test-key",
    )

    # Mock team with user as admin - use dict structure that matches Prisma return
    mock_team = MagicMock()
    mock_team.model_dump.return_value = {
        "team_id": "team-123",
        "members_with_roles": [
            {"user_id": "team-admin-user", "role": "admin"}
        ],
    }
    # Create team object from the dict (validator will convert members_with_roles to Member objects)
    mock_team_obj = LiteLLM_TeamTable(**mock_team.model_dump())

    # Mock user object with team membership
    mock_user_obj = LiteLLM_UserTable(
        user_id="team-admin-user",
        user_email="team-admin@example.com",
        organization_memberships=[],
        teams=["team-123"],
    )

    # Mock llm_router with proxy models
    mock_router = MagicMock()
    mock_router.get_model_names.return_value = ["gpt-4", "gpt-3.5-turbo", "claude-3-opus"]
    mock_router.get_model_access_groups.return_value = {}

    # Mock prisma_client
    mock_prisma_client = MagicMock()
    mock_prisma_client.db.litellm_teamtable.find_many = AsyncMock(
        return_value=[mock_team]
    )

    # Mock user_api_key_cache
    mock_user_api_key_cache = MagicMock()

    # Mock proxy_logging_obj
    mock_proxy_logging_obj = MagicMock()

    # Mock get_user_object to return user with team membership
    async def mock_get_user_object(*args, **kwargs):
        return mock_user_obj

    # Mock get_complete_model_list
    mock_all_models = ["gpt-4", "gpt-3.5-turbo", "claude-3-opus"]

    # Mock create_model_info_response
    def mock_create_model_info_response(model_id, provider, include_metadata=False, fallback_type=None, llm_router=None):
        return {"id": model_id, "object": "model"}

    # Apply monkeypatches
    monkeypatch.setattr("litellm.proxy.proxy_server.llm_router", mock_router)
    monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client)
    monkeypatch.setattr("litellm.proxy.proxy_server.user_api_key_cache", mock_user_api_key_cache)
    monkeypatch.setattr("litellm.proxy.proxy_server.proxy_logging_obj", mock_proxy_logging_obj)
    monkeypatch.setattr("litellm.proxy.proxy_server.general_settings", {})
    monkeypatch.setattr("litellm.proxy.proxy_server.user_model", None)
    monkeypatch.setattr(
        "litellm.proxy.auth.auth_checks.get_user_object",
        mock_get_user_object,
    )
    monkeypatch.setattr(
        "litellm.proxy.auth.model_checks.get_complete_model_list",
        lambda **kwargs: mock_all_models,
    )
    monkeypatch.setattr(
        "litellm.proxy.utils.create_model_info_response",
        mock_create_model_info_response,
    )

    # Call model_list with scope=expand
    result = await model_list(
        user_api_key_dict=mock_user_api_key_dict,
        scope="expand",
    )

    # Verify result contains all proxy models
    assert result["object"] == "list"
    assert len(result["data"]) == 3
    assert all(model["id"] in mock_all_models for model in result["data"])

    # Verify router methods were called
    mock_router.get_model_names.assert_called_once()
    mock_router.get_model_access_groups.assert_called_once()


@pytest.mark.asyncio
async def test_model_list_scope_expand_normal_user(monkeypatch):
    """Test that normal internal user with scope=expand returns only their models (not expanded)"""
    from litellm.proxy._types import LiteLLM_UserTable, LitellmUserRoles, UserAPIKeyAuth
    from litellm.proxy.proxy_server import model_list

    # Mock user API key dict for normal internal user
    mock_user_api_key_dict = UserAPIKeyAuth(
        user_id="normal-user",
        user_role=LitellmUserRoles.INTERNAL_USER,
        api_key="test-key",
        models=["gpt-3.5-turbo"],  # User only has access to this model
    )

    # Mock user object without admin privileges
    mock_user_obj = LiteLLM_UserTable(
        user_id="normal-user",
        user_email="normal@example.com",
        organization_memberships=[],  # No org admin
        teams=[],  # No teams
    )

    # Mock llm_router
    mock_router = MagicMock()
    mock_router.get_model_names.return_value = ["gpt-4", "gpt-3.5-turbo", "claude-3-opus"]

    # Mock prisma_client
    mock_prisma_client = MagicMock()

    # Mock user_api_key_cache
    mock_user_api_key_cache = MagicMock()

    # Mock proxy_logging_obj
    mock_proxy_logging_obj = MagicMock()

    # Mock get_user_object to return user without admin privileges
    async def mock_get_user_object(*args, **kwargs):
        return mock_user_obj

    # Mock get_available_models_for_user to return only user's models
    async def mock_get_available_models_for_user(*args, **kwargs):
        return ["gpt-3.5-turbo"]  # Only user's accessible models

    # Mock create_model_info_response
    def mock_create_model_info_response(model_id, provider, include_metadata=False, fallback_type=None, llm_router=None):
        return {"id": model_id, "object": "model"}

    # Apply monkeypatches
    monkeypatch.setattr("litellm.proxy.proxy_server.llm_router", mock_router)
    monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client)
    monkeypatch.setattr("litellm.proxy.proxy_server.user_api_key_cache", mock_user_api_key_cache)
    monkeypatch.setattr("litellm.proxy.proxy_server.proxy_logging_obj", mock_proxy_logging_obj)
    monkeypatch.setattr("litellm.proxy.proxy_server.general_settings", {})
    monkeypatch.setattr("litellm.proxy.proxy_server.user_model", None)
    monkeypatch.setattr(
        "litellm.proxy.auth.auth_checks.get_user_object",
        mock_get_user_object,
    )
    monkeypatch.setattr(
        "litellm.proxy.utils.get_available_models_for_user",
        mock_get_available_models_for_user,
    )
    monkeypatch.setattr(
        "litellm.proxy.utils.create_model_info_response",
        mock_create_model_info_response,
    )

    # Call model_list with scope=expand
    result = await model_list(
        user_api_key_dict=mock_user_api_key_dict,
        scope="expand",
    )

    # Verify result contains only user's models (not all proxy models)
    assert result["object"] == "list"
    assert len(result["data"]) == 1
    assert result["data"][0]["id"] == "gpt-3.5-turbo"

    # Verify router methods were NOT called (normal path, not expanded)
    mock_router.get_model_names.assert_not_called()
    mock_router.get_model_access_groups.assert_not_called()


@pytest.mark.asyncio
async def test_model_list_no_scope_parameter(monkeypatch):
    """Test that model_list without scope parameter uses normal behavior"""
    from litellm.proxy._types import LitellmUserRoles, UserAPIKeyAuth
    from litellm.proxy.proxy_server import model_list

    # Mock user API key dict
    mock_user_api_key_dict = UserAPIKeyAuth(
        user_id="test-user",
        user_role=LitellmUserRoles.INTERNAL_USER,
        api_key="test-key",
        models=["gpt-3.5-turbo"],
    )

    # Mock llm_router
    mock_router = MagicMock()

    # Mock prisma_client
    mock_prisma_client = MagicMock()

    # Mock user_api_key_cache
    mock_user_api_key_cache = MagicMock()

    # Mock proxy_logging_obj
    mock_proxy_logging_obj = MagicMock()

    # Mock get_available_models_for_user
    async def mock_get_available_models_for_user(*args, **kwargs):
        return ["gpt-3.5-turbo"]

    # Mock create_model_info_response
    def mock_create_model_info_response(model_id, provider, include_metadata=False, fallback_type=None, llm_router=None):
        return {"id": model_id, "object": "model"}

    # Apply monkeypatches
    monkeypatch.setattr("litellm.proxy.proxy_server.llm_router", mock_router)
    monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client)
    monkeypatch.setattr("litellm.proxy.proxy_server.user_api_key_cache", mock_user_api_key_cache)
    monkeypatch.setattr("litellm.proxy.proxy_server.proxy_logging_obj", mock_proxy_logging_obj)
    monkeypatch.setattr("litellm.proxy.proxy_server.general_settings", {})
    monkeypatch.setattr("litellm.proxy.proxy_server.user_model", None)
    monkeypatch.setattr(
        "litellm.proxy.utils.get_available_models_for_user",
        mock_get_available_models_for_user,
    )
    monkeypatch.setattr(
        "litellm.proxy.utils.create_model_info_response",
        mock_create_model_info_response,
    )

    # Call model_list without scope parameter
    result = await model_list(
        user_api_key_dict=mock_user_api_key_dict,
        scope=None,
    )

    # Verify result uses normal behavior
    assert result["object"] == "list"
    assert len(result["data"]) == 1
    assert result["data"][0]["id"] == "gpt-3.5-turbo"

    # Verify router methods were NOT called (normal path)
    mock_router.get_model_names.assert_not_called()
    mock_router.get_model_access_groups.assert_not_called()


@pytest.mark.asyncio
async def test_update_general_settings_store_prompts_in_spend_logs(monkeypatch):
    """
    Test that _update_general_settings correctly normalizes store_prompts_in_spend_logs
    values (handles bool, string, None, and other types).
    """
    from unittest.mock import patch

    from litellm.proxy.proxy_server import ProxyConfig

    proxy_config = ProxyConfig()

    # Test Case 1: None value
    mock_gs = {}
    with patch("litellm.proxy.proxy_server.general_settings", mock_gs):
        await proxy_config._update_general_settings(
            {"store_prompts_in_spend_logs": None}
        )
        assert mock_gs.get("store_prompts_in_spend_logs") is None

    # Test Case 2: bool True
    mock_gs = {}
    with patch("litellm.proxy.proxy_server.general_settings", mock_gs):
        await proxy_config._update_general_settings(
            {"store_prompts_in_spend_logs": True}
        )
        assert mock_gs.get("store_prompts_in_spend_logs") is True

    # Test Case 3: bool False
    mock_gs = {}
    with patch("litellm.proxy.proxy_server.general_settings", mock_gs):
        await proxy_config._update_general_settings(
            {"store_prompts_in_spend_logs": False}
        )
        assert mock_gs.get("store_prompts_in_spend_logs") is False

    # Test Case 4: string "true" (lowercase)
    mock_gs = {}
    with patch("litellm.proxy.proxy_server.general_settings", mock_gs):
        await proxy_config._update_general_settings(
            {"store_prompts_in_spend_logs": "true"}
        )
        assert mock_gs.get("store_prompts_in_spend_logs") is True

    # Test Case 5: string "True" (capitalized)
    mock_gs = {}
    with patch("litellm.proxy.proxy_server.general_settings", mock_gs):
        await proxy_config._update_general_settings(
            {"store_prompts_in_spend_logs": "True"}
        )
        assert mock_gs.get("store_prompts_in_spend_logs") is True

    # Test Case 6: string "TRUE" (uppercase)
    mock_gs = {}
    with patch("litellm.proxy.proxy_server.general_settings", mock_gs):
        await proxy_config._update_general_settings(
            {"store_prompts_in_spend_logs": "TRUE"}
        )
        assert mock_gs.get("store_prompts_in_spend_logs") is True

    # Test Case 7: string "false" (lowercase)
    mock_gs = {}
    with patch("litellm.proxy.proxy_server.general_settings", mock_gs):
        await proxy_config._update_general_settings(
            {"store_prompts_in_spend_logs": "false"}
        )
        assert mock_gs.get("store_prompts_in_spend_logs") is False

    # Test Case 8: string "False" (capitalized)
    mock_gs = {}
    with patch("litellm.proxy.proxy_server.general_settings", mock_gs):
        await proxy_config._update_general_settings(
            {"store_prompts_in_spend_logs": "False"}
        )
        assert mock_gs.get("store_prompts_in_spend_logs") is False

    # Test Case 9: string "FALSE" (uppercase)
    mock_gs = {}
    with patch("litellm.proxy.proxy_server.general_settings", mock_gs):
        await proxy_config._update_general_settings(
            {"store_prompts_in_spend_logs": "FALSE"}
        )
        assert mock_gs.get("store_prompts_in_spend_logs") is False

    # Test Case 10: other string value (should be False)
    mock_gs = {}
    with patch("litellm.proxy.proxy_server.general_settings", mock_gs):
        await proxy_config._update_general_settings(
            {"store_prompts_in_spend_logs": "invalid"}
        )
        assert mock_gs.get("store_prompts_in_spend_logs") is False

    # Test Case 11: integer 1 (should be True)
    mock_gs = {}
    with patch("litellm.proxy.proxy_server.general_settings", mock_gs):
        await proxy_config._update_general_settings(
            {"store_prompts_in_spend_logs": 1}
        )
        assert mock_gs.get("store_prompts_in_spend_logs") is True

    # Test Case 12: integer 0 (should be False)
    mock_gs = {}
    with patch("litellm.proxy.proxy_server.general_settings", mock_gs):
        await proxy_config._update_general_settings(
            {"store_prompts_in_spend_logs": 0}
        )
        assert mock_gs.get("store_prompts_in_spend_logs") is False


@pytest.mark.asyncio
async def test_update_general_settings_maximum_spend_logs_retention_period(monkeypatch):
    """
    Test that _update_general_settings correctly handles maximum_spend_logs_retention_period
    and reschedules cleanup job when value changes.
    """
    from unittest.mock import AsyncMock, patch

    from litellm.proxy.proxy_server import ProxyConfig

    proxy_config = ProxyConfig()

    # Test Case 1: Setting a new value should reschedule cleanup job
    mock_reschedule = AsyncMock()
    mock_gs = {}
    with patch("litellm.proxy.proxy_server.general_settings", mock_gs), patch.object(
        proxy_config, "_reschedule_spend_log_cleanup_job", mock_reschedule
    ):
        await proxy_config._update_general_settings(
            {"maximum_spend_logs_retention_period": "7d"}
        )
        assert mock_gs.get("maximum_spend_logs_retention_period") == "7d"
        mock_reschedule.assert_called_once()

    # Test Case 2: Setting the same value should not reschedule
    mock_reschedule.reset_mock()
    mock_gs = {"maximum_spend_logs_retention_period": "7d"}
    with patch("litellm.proxy.proxy_server.general_settings", mock_gs), patch.object(
        proxy_config, "_reschedule_spend_log_cleanup_job", mock_reschedule
    ):
        await proxy_config._update_general_settings(
            {"maximum_spend_logs_retention_period": "7d"}
        )
        assert mock_gs.get("maximum_spend_logs_retention_period") == "7d"
        mock_reschedule.assert_not_called()

    # Test Case 3: Changing value should reschedule
    mock_reschedule.reset_mock()
    mock_gs = {"maximum_spend_logs_retention_period": "7d"}
    with patch("litellm.proxy.proxy_server.general_settings", mock_gs), patch.object(
        proxy_config, "_reschedule_spend_log_cleanup_job", mock_reschedule
    ):
        await proxy_config._update_general_settings(
            {"maximum_spend_logs_retention_period": "30d"}
        )
        assert mock_gs.get("maximum_spend_logs_retention_period") == "30d"
        mock_reschedule.assert_called_once()

    # Test Case 4: Setting to None should reschedule
    mock_reschedule.reset_mock()
    mock_gs = {"maximum_spend_logs_retention_period": "7d"}
    with patch("litellm.proxy.proxy_server.general_settings", mock_gs), patch.object(
        proxy_config, "_reschedule_spend_log_cleanup_job", mock_reschedule
    ):
        await proxy_config._update_general_settings(
            {"maximum_spend_logs_retention_period": None}
        )
        assert mock_gs.get("maximum_spend_logs_retention_period") is None
        mock_reschedule.assert_called_once()

    # Test Case 5: Changing from None to a value should reschedule
    mock_reschedule.reset_mock()
    mock_gs = {}
    with patch("litellm.proxy.proxy_server.general_settings", mock_gs), patch.object(
        proxy_config, "_reschedule_spend_log_cleanup_job", mock_reschedule
    ):
        await proxy_config._update_general_settings(
            {"maximum_spend_logs_retention_period": "24h"}
        )
        assert mock_gs.get("maximum_spend_logs_retention_period") == "24h"
        mock_reschedule.assert_called_once()

    # Test Case 6: Setting None when already None should not reschedule
    mock_reschedule.reset_mock()
    mock_gs = {}
    with patch("litellm.proxy.proxy_server.general_settings", mock_gs), patch.object(
        proxy_config, "_reschedule_spend_log_cleanup_job", mock_reschedule
    ):
        await proxy_config._update_general_settings(
            {"maximum_spend_logs_retention_period": None}
        )
        assert mock_gs.get("maximum_spend_logs_retention_period") is None
        mock_reschedule.assert_not_called()