import asyncio import importlib import json import os import socket import subprocess import sys from datetime import datetime, timezone from pathlib import Path from unittest import mock from unittest.mock import AsyncMock, MagicMock, mock_open, patch import click import httpx import pytest import yaml from fastapi import FastAPI from fastapi.staticfiles import StaticFiles from fastapi.testclient import TestClient sys.path.insert( 0, os.path.abspath("../../..") ) # Adds the parent directory to the system-path import litellm from litellm.proxy.auth.user_api_key_auth import user_api_key_auth from litellm.proxy.proxy_server import app, initialize from litellm.utils import _invalidate_model_cost_lowercase_map example_embedding_result = { "object": "list", "data": [ { "object": "embedding", "index": 0, "embedding": [ -0.006929283495992422, -0.005336422007530928, -4.547132266452536e-05, -0.024047505110502243, -0.006929283495992422, -0.005336422007530928, -4.547132266452536e-05, -0.024047505110502243, -0.006929283495992422, -0.005336422007530928, -4.547132266452536e-05, -0.024047505110502243, ], } ], "model": "text-embedding-3-small", "usage": {"prompt_tokens": 5, "total_tokens": 5}, } def mock_patch_aembedding(): return mock.patch( "litellm.proxy.proxy_server.llm_router.aembedding", return_value=example_embedding_result, ) @pytest.fixture(scope="function") def client_no_auth(): # Assuming litellm.proxy.proxy_server is an object from litellm.proxy.proxy_server import cleanup_router_config_variables cleanup_router_config_variables() filepath = os.path.dirname(os.path.abspath(__file__)) config_fp = f"{filepath}/test_configs/test_config_no_auth.yaml" # initialize can get run in parallel, it sets specific variables for the fast api app, sinc eit gets run in parallel different tests use the wrong variables asyncio.run(initialize(config=config_fp, debug=True)) return TestClient(app) def test_login_v2_returns_redirect_url_and_sets_cookie(monkeypatch): mock_login_result = {"user_id": "test-user"} mock_prisma_client = MagicMock() mock_authenticate_user = AsyncMock(return_value=mock_login_result) mock_create_ui_token_object = MagicMock(return_value={"user_id": "test-user"}) mock_jwt_encode = MagicMock(return_value="signed-token") monkeypatch.setattr( "litellm.proxy.auth.login_utils.authenticate_user", mock_authenticate_user, ) monkeypatch.setattr( "litellm.proxy.auth.login_utils.create_ui_token_object", mock_create_ui_token_object, ) monkeypatch.setattr("jwt.encode", mock_jwt_encode) monkeypatch.setattr("litellm.proxy.proxy_server.master_key", "test-master-key") monkeypatch.setattr("litellm.proxy.proxy_server.general_settings", {}) monkeypatch.setattr("litellm.proxy.proxy_server.premium_user", False) monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client) monkeypatch.setattr("litellm.proxy.utils.get_server_root_path", lambda: "") monkeypatch.setattr("litellm.proxy.utils.get_proxy_base_url", lambda: None) client = TestClient(app) response = client.post( "/v2/login", json={"username": "alice", "password": "secret"}, ) assert response.status_code == 200 assert ( response.json() == {"redirect_url": "http://testserver/ui/?login=success"} ) assert response.cookies.get("token") == "signed-token" mock_authenticate_user.assert_awaited_once_with( username="alice", password="secret", master_key="test-master-key", prisma_client=mock_prisma_client, ) mock_create_ui_token_object.assert_called_once_with( login_result=mock_login_result, general_settings={}, premium_user=False, ) mock_jwt_encode.assert_called_once_with( {"user_id": "test-user"}, "test-master-key", algorithm="HS256", ) def test_login_v2_returns_json_on_proxy_exception(monkeypatch): """Test that /v2/login returns JSON error when ProxyException is raised""" from litellm.proxy._types import ProxyErrorTypes, ProxyException mock_prisma_client = MagicMock() mock_authenticate_user = AsyncMock( side_effect=ProxyException( message="Invalid credentials", type=ProxyErrorTypes.auth_error, param="password", code=401, ) ) monkeypatch.setattr( "litellm.proxy.auth.login_utils.authenticate_user", mock_authenticate_user, ) monkeypatch.setattr("litellm.proxy.proxy_server.master_key", "test-master-key") monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client) client = TestClient(app) response = client.post( "/v2/login", json={"username": "alice", "password": "wrong"}, ) assert response.status_code == 401 assert response.headers["content-type"] == "application/json" data = response.json() assert "error" in data assert data["error"]["message"] == "Invalid credentials" assert data["error"]["type"] == "auth_error" def test_login_v2_returns_json_on_http_exception(monkeypatch): """Test that /v2/login converts HTTPException to JSON error response""" from fastapi import HTTPException mock_prisma_client = MagicMock() mock_authenticate_user = AsyncMock( side_effect=HTTPException(status_code=401, detail="Unauthorized") ) monkeypatch.setattr( "litellm.proxy.auth.login_utils.authenticate_user", mock_authenticate_user, ) monkeypatch.setattr("litellm.proxy.proxy_server.master_key", "test-master-key") monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client) client = TestClient(app) response = client.post( "/v2/login", json={"username": "alice", "password": "secret"}, ) assert response.status_code == 401 assert response.headers["content-type"] == "application/json" data = response.json() assert "error" in data assert isinstance(data["error"], dict) def test_login_v2_returns_json_on_unexpected_exception(monkeypatch): """Test that /v2/login returns JSON error when unexpected exception occurs""" mock_prisma_client = MagicMock() mock_authenticate_user = AsyncMock(side_effect=ValueError("Unexpected error")) monkeypatch.setattr( "litellm.proxy.auth.login_utils.authenticate_user", mock_authenticate_user, ) monkeypatch.setattr("litellm.proxy.proxy_server.master_key", "test-master-key") monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client) client = TestClient(app) response = client.post( "/v2/login", json={"username": "alice", "password": "secret"}, ) assert response.status_code == 500 assert response.headers["content-type"] == "application/json" data = response.json() assert "error" in data assert isinstance(data["error"], dict) assert "Unexpected error" in data["error"]["message"] def test_login_v2_returns_json_on_invalid_json_body(monkeypatch): """Test that /v2/login returns JSON error when request body is invalid JSON""" monkeypatch.setattr("litellm.proxy.proxy_server.master_key", "test-master-key") client = TestClient(app) response = client.post( "/v2/login", content="invalid json", headers={"Content-Type": "application/json"}, ) assert response.status_code == 500 assert response.headers["content-type"] == "application/json" data = response.json() assert "error" in data assert isinstance(data["error"], dict) def test_fallback_login_has_no_deprecation_banner(client_no_auth): response = client_no_auth.get("/fallback/login") assert response.status_code == 200 html = response.text assert '
' not in html assert "Deprecated:" not in html assert "' in html assert "Deprecated:" in html def test_restructure_ui_html_files_handles_nested_routes(tmp_path): """ Test that _restructure_ui_html_files correctly restructures HTML files. Note: This function is always called now, both in development and non-root Docker environments. """ from litellm.proxy import proxy_server ui_root = tmp_path / "ui" ui_root.mkdir() def write_file(path: Path, content: str) -> None: path.parent.mkdir(parents=True, exist_ok=True) path.write_text(content) write_file(ui_root / "home.html", "home") write_file(ui_root / "mcp" / "oauth" / "callback.html", "callback") write_file(ui_root / "existing" / "index.html", "keep") write_file(ui_root / "_next" / "ignore.html", "asset") write_file(ui_root / "litellm-asset-prefix" / "ignore.html", "asset") proxy_server._restructure_ui_html_files(str(ui_root)) assert not (ui_root / "home.html").exists() assert (ui_root / "home" / "index.html").read_text() == "home" assert not (ui_root / "mcp" / "oauth" / "callback.html").exists() assert ( (ui_root / "mcp" / "oauth" / "callback" / "index.html").read_text() == "callback" ) assert (ui_root / "existing" / "index.html").read_text() == "keep" assert (ui_root / "_next" / "ignore.html").read_text() == "asset" assert ( (ui_root / "litellm-asset-prefix" / "ignore.html").read_text() == "asset" ) def test_ui_extensionless_route_requires_restructure(tmp_path): """ Regression for non-root fallback: /ui/login expects login/index.html. Note: Restructuring always happens now, both in development and non-root Docker environments. """ from litellm.proxy import proxy_server ui_root = tmp_path / "ui" ui_root.mkdir() (ui_root / "index.html").write_text("index") (ui_root / "login.html").write_text("login") fastapi_app = FastAPI() fastapi_app.mount( "/ui", StaticFiles(directory=str(ui_root), html=True), name="ui" ) client = TestClient(fastapi_app) assert client.get("/ui/login.html").status_code == 200 assert client.get("/ui/login").status_code == 404 proxy_server._restructure_ui_html_files(str(ui_root)) response = client.get("/ui/login") assert response.status_code == 200 assert "login" in response.text def test_restructure_always_happens(monkeypatch): """ Test that restructuring logic always executes regardless of LITELLM_NON_ROOT setting. In development (is_non_root=False), restructuring happens directly in _experimental/out. In non-root Docker (is_non_root=True), restructuring happens in /var/lib/litellm/ui. """ # Test Case 1: is_non_root is True - restructuring happens in /var/lib/litellm/ui monkeypatch.setenv("LITELLM_NON_ROOT", "true") runtime_ui_path = "/var/lib/litellm/ui" packaged_ui_path = "/some/packaged/ui/path" # Simulate the logic from proxy_server.py is_non_root = os.getenv("LITELLM_NON_ROOT", "").lower() == "true" if is_non_root: ui_path = runtime_ui_path else: ui_path = packaged_ui_path # Restructuring always happens now, regardless of ui_path vs packaged_ui_path should_restructure = True assert is_non_root is True assert should_restructure is True assert ui_path == runtime_ui_path # Test Case 2: is_non_root is False - restructuring happens directly in packaged_ui_path monkeypatch.delenv("LITELLM_NON_ROOT", raising=False) # Simulate the logic from proxy_server.py is_non_root = os.getenv("LITELLM_NON_ROOT", "").lower() == "true" if is_non_root: ui_path = runtime_ui_path else: ui_path = packaged_ui_path # Restructuring always happens now, even when ui_path == packaged_ui_path should_restructure = True assert is_non_root is False assert should_restructure is True assert ui_path == packaged_ui_path @pytest.mark.asyncio async def test_initialize_scheduled_jobs_credentials(monkeypatch): """ Test that get_credentials is only called when store_model_in_db is True """ monkeypatch.delenv("DISABLE_PRISMA_SCHEMA_UPDATE", raising=False) monkeypatch.delenv("STORE_MODEL_IN_DB", raising=False) from litellm.proxy.proxy_server import ProxyStartupEvent from litellm.proxy.utils import ProxyLogging # Mock dependencies mock_prisma_client = MagicMock() mock_proxy_logging = MagicMock(spec=ProxyLogging) mock_proxy_logging.slack_alerting_instance = MagicMock() mock_proxy_config = AsyncMock() with patch("litellm.proxy.proxy_server.proxy_config", mock_proxy_config), patch( "litellm.proxy.proxy_server.store_model_in_db", False ): # set store_model_in_db to False # Test when store_model_in_db is False await ProxyStartupEvent.initialize_scheduled_background_jobs( general_settings={}, prisma_client=mock_prisma_client, proxy_budget_rescheduler_min_time=1, proxy_budget_rescheduler_max_time=2, proxy_batch_write_at=5, proxy_logging_obj=mock_proxy_logging, ) # Verify get_credentials was not called mock_proxy_config.get_credentials.assert_not_called() # Now test with store_model_in_db = True with patch("litellm.proxy.proxy_server.proxy_config", mock_proxy_config), patch( "litellm.proxy.proxy_server.store_model_in_db", True ), patch("litellm.proxy.proxy_server.get_secret_bool", return_value=True): await ProxyStartupEvent.initialize_scheduled_background_jobs( general_settings={}, prisma_client=mock_prisma_client, proxy_budget_rescheduler_min_time=1, proxy_budget_rescheduler_max_time=2, proxy_batch_write_at=5, proxy_logging_obj=mock_proxy_logging, ) # Verify get_credentials was called both directly and scheduled assert mock_proxy_config.get_credentials.call_count == 1 # Direct call # Verify a scheduled job was added for get_credentials mock_scheduler_calls = [ call[0] for call in mock_proxy_config.get_credentials.mock_calls ] assert len(mock_scheduler_calls) > 0 def test_update_config_fields_deep_merge_db_wins(): from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() current_config = { "router_settings": { "routing_mode": "cost_optimized", "model_group_alias": { # Existing alias with older model + different hidden flag "claude-sonnet-4": { "model": "claude-sonnet-4-20240219", "hidden": True, }, # An extra alias that should remain untouched unless DB overrides it "legacy-sonnet": { "model": "claude-2.1", "hidden": True, }, }, } } db_param_value = { "model_group_alias": { # Conflict: DB should win (both 'model' and 'hidden') "claude-sonnet-4": { "model": "claude-sonnet-4-20250514", "hidden": False, }, # New alias to be added by the merge "claude-sonnet-latest": { "model": "claude-sonnet-4-20250514", "hidden": True, }, # Demonstrate that None values from DB are skipped (preserve existing) "legacy-sonnet": { "hidden": None # should not clobber current True }, } } updated = proxy_config._update_config_fields( current_config=current_config, param_name="router_settings", db_param_value=db_param_value, ) rs = updated["router_settings"] aliases = rs["model_group_alias"] # DB wins on conflicts (deep) for existing alias assert aliases["claude-sonnet-4"]["model"] == "claude-sonnet-4-20250514" assert aliases["claude-sonnet-4"]["hidden"] is False # New alias introduced by DB is present with its values assert "claude-sonnet-latest" in aliases assert aliases["claude-sonnet-latest"]["model"] == "claude-sonnet-4-20250514" assert aliases["claude-sonnet-latest"]["hidden"] is True # None in DB does not overwrite existing values assert aliases["legacy-sonnet"]["model"] == "claude-2.1" assert aliases["legacy-sonnet"]["hidden"] is True # Unrelated router_settings keys are preserved assert rs["routing_mode"] == "cost_optimized" def test_get_config_custom_callback_api_env_vars(monkeypatch): """ Ensure /get/config/callbacks returns custom callback env vars when both custom values are provided. """ from litellm.proxy.proxy_server import app, proxy_config, user_api_key_auth # Mock config with custom_callback_api enabled and generic logger env vars present config_data = { "litellm_settings": {"success_callback": ["custom_callback_api"]}, "general_settings": {}, "environment_variables": { "GENERIC_LOGGER_ENDPOINT": "https://callback.example.com", "GENERIC_LOGGER_HEADERS": "Auth: token", }, } # Mock proxy_config.get_config and router settings mock_router = MagicMock() mock_router.get_settings.return_value = {} monkeypatch.setattr("litellm.proxy.proxy_server.llm_router", mock_router) monkeypatch.setattr( proxy_config, "get_config", AsyncMock(return_value=config_data) ) # Bypass auth dependency original_overrides = app.dependency_overrides.copy() app.dependency_overrides[user_api_key_auth] = lambda: MagicMock() client = TestClient(app) try: response = client.get("/get/config/callbacks") finally: app.dependency_overrides = original_overrides assert response.status_code == 200 callbacks = response.json()["callbacks"] custom_cb = next( (cb for cb in callbacks if cb["name"] == "custom_callback_api"), None ) assert custom_cb is not None assert custom_cb["variables"] == { "GENERIC_LOGGER_ENDPOINT": "https://callback.example.com", "GENERIC_LOGGER_HEADERS": "Auth: token", } # Mock Prisma class MockPrisma: def __init__(self, database_url=None, proxy_logging_obj=None, http_client=None): self.database_url = database_url self.proxy_logging_obj = proxy_logging_obj self.http_client = http_client async def connect(self): pass async def disconnect(self): pass mock_prisma = MockPrisma() @patch( "litellm.proxy.proxy_server.ProxyStartupEvent._setup_prisma_client", return_value=mock_prisma, ) @pytest.mark.asyncio async def test_aaaproxy_startup_master_key(mock_prisma, monkeypatch, tmp_path): """ Test that master_key is correctly loaded from either config.yaml or environment variables """ import yaml from fastapi import FastAPI # Import happens here - this is when the module probably reads the config path from litellm.proxy.proxy_server import proxy_startup_event # Mock the Prisma import monkeypatch.setattr("litellm.proxy.proxy_server.PrismaClient", MockPrisma) # Create test app app = FastAPI() # Test Case 1: Master key from config.yaml test_master_key = "sk-12345" test_config = {"general_settings": {"master_key": test_master_key}} # Create a temporary config file config_path = tmp_path / "config.yaml" with open(config_path, "w") as f: yaml.dump(test_config, f) print(f"SET ENV VARIABLE - CONFIG_FILE_PATH, str(config_path): {str(config_path)}") # Second setting of CONFIG_FILE_PATH to a different value monkeypatch.setenv("CONFIG_FILE_PATH", str(config_path)) print(f"config_path: {config_path}") print(f"os.getenv('CONFIG_FILE_PATH'): {os.getenv('CONFIG_FILE_PATH')}") async with proxy_startup_event(app): from litellm.proxy.proxy_server import master_key assert master_key == test_master_key # Test Case 2: Master key from environment variable test_env_master_key = "sk-test-67890" # Create empty config empty_config = {"general_settings": {}} with open(config_path, "w") as f: yaml.dump(empty_config, f) monkeypatch.setenv("LITELLM_MASTER_KEY", test_env_master_key) print("test_env_master_key: {}".format(test_env_master_key)) async with proxy_startup_event(app): from litellm.proxy.proxy_server import master_key assert master_key == test_env_master_key # Test Case 3: Master key with os.environ prefix test_resolved_key = "sk-resolved-key" test_config_with_prefix = { "general_settings": {"master_key": "os.environ/CUSTOM_MASTER_KEY"} } # Create config with os.environ prefix with open(config_path, "w") as f: yaml.dump(test_config_with_prefix, f) monkeypatch.setenv("CUSTOM_MASTER_KEY", test_resolved_key) async with proxy_startup_event(app): from litellm.proxy.proxy_server import master_key assert master_key == test_resolved_key def test_team_info_masking(): """ Test that sensitive team information is properly masked Ref: https://huntr.com/bounties/661b388a-44d8-4ad5-862b-4dc5b80be30a """ from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() # Test team object with sensitive data team1_info = { "success_callback": "['langfuse', 's3']", "langfuse_secret": "secret-test-key", "langfuse_public_key": "public-test-key", } with pytest.raises(Exception) as exc_info: proxy_config._get_team_config( team_id="test_dev", all_teams_config=[team1_info], ) print("Got exception: {}".format(exc_info.value)) assert "secret-test-key" not in str(exc_info.value) assert "public-test-key" not in str(exc_info.value) def test_embedding_input_array_of_tokens(client_no_auth): """ Test to bypass decoding input as array of tokens for selected providers Ref: https://github.com/BerriAI/litellm/issues/10113 """ from litellm.proxy import proxy_server # The client_no_auth fixture should initialize the router # Assert this to catch any router initialization regressions assert proxy_server.llm_router is not None, ( "llm_router is None after client_no_auth fixture initialized. " "This indicates a router initialization issue that should be investigated." ) try: with mock.patch.object( proxy_server.llm_router, "aembedding", return_value=example_embedding_result, ) as mock_aembedding: test_data = { "model": "vllm_embed_model", "input": [[2046, 13269, 158208]], } response = client_no_auth.post("/v1/embeddings", json=test_data) # Assert that aembedding was called, and that input was not modified mock_aembedding.assert_called_once() call_args, call_kwargs = mock_aembedding.call_args assert call_kwargs["model"] == "vllm_embed_model" assert call_kwargs["input"] == [[2046, 13269, 158208]] assert response.status_code == 200 result = response.json() print(len(result["data"][0]["embedding"])) assert len(result["data"][0]["embedding"]) > 10 # this usually has len==1536 so except Exception as e: pytest.fail(f"LiteLLM Proxy test failed. Exception - {str(e)}") @pytest.mark.asyncio async def test_get_all_team_models(): """ Test get_all_team_models function with both "*" and specific team IDs """ from unittest.mock import AsyncMock, MagicMock from litellm.proxy._types import LiteLLM_TeamTable from litellm.proxy.proxy_server import get_all_team_models # Mock team data mock_team1 = MagicMock() mock_team1.model_dump.return_value = { "team_id": "team1", "models": ["gpt-4", "gpt-3.5-turbo"], "team_alias": "Team 1", } mock_team2 = MagicMock() mock_team2.model_dump.return_value = { "team_id": "team2", "models": ["claude-3", "gpt-4"], "team_alias": "Team 2", } # Mock model data returned by router mock_models_gpt4 = [ {"model_info": {"id": "gpt-4-model-1"}}, {"model_info": {"id": "gpt-4-model-2"}}, ] mock_models_gpt35 = [ {"model_info": {"id": "gpt-3.5-turbo-model-1"}}, ] mock_models_claude = [ {"model_info": {"id": "claude-3-model-1"}}, ] # Mock prisma client mock_prisma_client = MagicMock() mock_db = MagicMock() mock_litellm_teamtable = MagicMock() mock_prisma_client.db = mock_db mock_db.litellm_teamtable = mock_litellm_teamtable # Make find_many async mock_litellm_teamtable.find_many = AsyncMock() # Mock router mock_router = MagicMock() def mock_get_model_list(model_name, team_id=None): if model_name == "gpt-4": return mock_models_gpt4 elif model_name == "gpt-3.5-turbo": return mock_models_gpt35 elif model_name == "claude-3": return mock_models_claude return None mock_router.get_model_list.side_effect = mock_get_model_list # Test Case 1: user_teams = "*" (all teams) mock_litellm_teamtable.find_many.return_value = [mock_team1, mock_team2] with patch("litellm.proxy.proxy_server.LiteLLM_TeamTable") as mock_team_table_class: # Configure the mock class to return proper instances def mock_team_table_constructor(**kwargs): mock_instance = MagicMock() mock_instance.team_id = kwargs["team_id"] mock_instance.models = kwargs["models"] return mock_instance mock_team_table_class.side_effect = mock_team_table_constructor result = await get_all_team_models( user_teams="*", prisma_client=mock_prisma_client, llm_router=mock_router, ) # Verify find_many was called without where clause for "*" mock_litellm_teamtable.find_many.assert_called_with() # Verify router.get_model_list was called for each model expected_calls = [ mock.call(model_name="gpt-4", team_id="team1"), mock.call(model_name="gpt-3.5-turbo", team_id="team1"), mock.call(model_name="claude-3", team_id="team2"), mock.call(model_name="gpt-4", team_id="team2"), ] mock_router.get_model_list.assert_has_calls(expected_calls, any_order=True) # Test Case 2: user_teams = specific list mock_litellm_teamtable.reset_mock() mock_router.reset_mock() mock_router.get_model_list.side_effect = mock_get_model_list # Only return team1 for specific team query mock_litellm_teamtable.find_many.return_value = [mock_team1] with patch("litellm.proxy.proxy_server.LiteLLM_TeamTable") as mock_team_table_class: mock_team_table_class.side_effect = mock_team_table_constructor result = await get_all_team_models( user_teams=["team1"], prisma_client=mock_prisma_client, llm_router=mock_router, ) # Verify find_many was called with where clause for specific teams mock_litellm_teamtable.find_many.assert_called_with( where={"team_id": {"in": ["team1"]}} ) # Verify router.get_model_list was called only for team1 models expected_calls = [ mock.call(model_name="gpt-4", team_id="team1"), mock.call(model_name="gpt-3.5-turbo", team_id="team1"), ] mock_router.get_model_list.assert_has_calls(expected_calls, any_order=True) # Test Case 3: Empty teams list mock_litellm_teamtable.reset_mock() mock_router.reset_mock() mock_litellm_teamtable.find_many.return_value = [] result = await get_all_team_models( user_teams=[], prisma_client=mock_prisma_client, llm_router=mock_router, ) # Verify find_many was called with empty list mock_litellm_teamtable.find_many.assert_called_with(where={"team_id": {"in": []}}) # Should return empty list when no teams assert result == {} # Test Case 4: Router returns None for some models mock_litellm_teamtable.reset_mock() mock_router.reset_mock() mock_litellm_teamtable.find_many.return_value = [mock_team1] def mock_get_model_list_with_none(model_name, team_id=None): if model_name == "gpt-4": return mock_models_gpt4 # Return None for gpt-3.5-turbo to test None handling return None mock_router.get_model_list.side_effect = mock_get_model_list_with_none with patch("litellm.proxy.proxy_server.LiteLLM_TeamTable") as mock_team_table_class: mock_team_table_class.side_effect = mock_team_table_constructor result = await get_all_team_models( user_teams=["team1"], prisma_client=mock_prisma_client, llm_router=mock_router, ) # Should handle None return gracefully assert isinstance(result, dict) print("result: ", result) assert result == {"gpt-4-model-1": ["team1"], "gpt-4-model-2": ["team1"]} def test_add_team_models_to_all_models(): """ Test add_team_models_to_all_models function """ from litellm.proxy._types import LiteLLM_TeamTable from litellm.proxy.proxy_server import _add_team_models_to_all_models team_db_objects_typed = MagicMock(spec=LiteLLM_TeamTable) team_db_objects_typed.team_id = "team1" team_db_objects_typed.models = ["all-proxy-models"] llm_router = MagicMock() llm_router.get_model_list.return_value = [ {"model_info": {"id": "gpt-4-model-1", "team_id": "team2"}}, {"model_info": {"id": "gpt-4-model-2"}}, ] result = _add_team_models_to_all_models( team_db_objects_typed=[team_db_objects_typed], llm_router=llm_router, ) assert result == {"gpt-4-model-2": {"team1"}} @pytest.mark.asyncio async def test_delete_deployment_type_mismatch(): """ Test that the _delete_deployment function handles type mismatches correctly. Specifically test that models 12345678 and 12345679 are NOT deleted when they exist in both combined_id_list (as integers) and router_model_ids (as strings). This test reproduces the bug where type mismatch causes valid models to be deleted. """ from unittest.mock import MagicMock, patch from litellm.proxy.proxy_server import ProxyConfig # Create mock ProxyConfig instance pc = ProxyConfig() pc.get_config = MagicMock( return_value={ "model_list": [ { "model_name": "openai-gpt-4o", "litellm_params": {"model": "gpt-4o"}, "model_info": {"id": 12345678}, }, { "model_name": "openai-gpt-4o", "litellm_params": {"model": "gpt-4o"}, "model_info": {"id": 12345679}, }, ] } ) # Mock llm_router with string IDs (this is the source of the type mismatch) mock_llm_router = MagicMock() mock_llm_router.get_model_ids.return_value = [ "a96e12e76b36a57cfae57a41288eb41567629cac89b4828c6f7074afc3534695", "a40186dd0fdb9b7282380277d7f57044d29de95bfbfcd7f4322b3493702d5cd3", "12345678", # String ID "12345679", # String ID ] # Track which deployments were deleted deleted_ids = [] def mock_delete_deployment(id): deleted_ids.append(id) return True # Simulate successful deletion mock_llm_router.delete_deployment = MagicMock(side_effect=mock_delete_deployment) # Mock get_config to return empty config (no config models) async def mock_get_config(config_file_path): return {} pc.get_config = MagicMock(side_effect=mock_get_config) # Patch the global llm_router with patch("litellm.proxy.proxy_server.llm_router", mock_llm_router), patch( "litellm.proxy.proxy_server.user_config_file_path", "test_config.yaml" ): # Call the function under test deleted_count = await pc._delete_deployment(db_models=[]) # Assertions: Models 12345678 and 12345679 should NOT be deleted # because they exist in combined_id_list (as integers) even though # router has them as strings # The function should delete the other 2 models that are not in combined_id_list assert deleted_count == 0, f"Expected 0 deletions, got {deleted_count}" # Verify that 12345678 and 12345679 were NOT deleted assert ( "12345678" not in deleted_ids ), f"Model 12345678 should NOT be deleted. Deleted IDs: {deleted_ids}" assert ( "12345679" not in deleted_ids ), f"Model 12345679 should NOT be deleted. Deleted IDs: {deleted_ids}" @pytest.mark.asyncio async def test_get_config_from_file(tmp_path, monkeypatch): """ Test the _get_config_from_file method of ProxyConfig class. Tests various scenarios: valid file, non-existent file, no file path, None config. """ import yaml from litellm.proxy.proxy_server import ProxyConfig # Create a ProxyConfig instance proxy_config = ProxyConfig() # Test Case 1: Valid YAML config file exists test_config = { "model_list": [{"model_name": "gpt-4", "litellm_params": {"model": "gpt-4"}}], "general_settings": {"master_key": "sk-test"}, "router_settings": {"enable_pre_call_checks": True}, "litellm_settings": {"drop_params": True}, } config_file = tmp_path / "test_config.yaml" with open(config_file, "w") as f: yaml.dump(test_config, f) # Clear global user_config_file_path for this test monkeypatch.setattr("litellm.proxy.proxy_server.user_config_file_path", None) result = await proxy_config._get_config_from_file(str(config_file)) assert result == test_config # Verify that user_config_file_path was set from litellm.proxy.proxy_server import user_config_file_path assert user_config_file_path == str(config_file) # Test Case 2: File path provided but file doesn't exist non_existent_file = tmp_path / "non_existent.yaml" with pytest.raises(Exception, match=f"Config file not found: {non_existent_file}"): await proxy_config._get_config_from_file(str(non_existent_file)) # Test Case 3: No file path provided (should return default config) monkeypatch.setattr("litellm.proxy.proxy_server.user_config_file_path", None) expected_default = { "model_list": [], "general_settings": {}, "router_settings": {}, "litellm_settings": {}, } result = await proxy_config._get_config_from_file(None) assert result == expected_default # Test Case 4: Empty YAML file (should raise exception for None config) empty_file = tmp_path / "empty_config.yaml" with open(empty_file, "w") as f: f.write("") # Write empty content which will result in None when loaded with pytest.raises(Exception, match="Config cannot be None or Empty."): await proxy_config._get_config_from_file(str(empty_file)) # Test Case 5: Using global user_config_file_path when no config_file_path provided monkeypatch.setattr( "litellm.proxy.proxy_server.user_config_file_path", str(config_file) ) result = await proxy_config._get_config_from_file(None) assert result == test_config def test_normalize_datetime_for_sorting(): """ Test the _normalize_datetime_for_sorting function. Tests various scenarios: None values, ISO format strings, datetime objects (naive and aware). """ from litellm.proxy.proxy_server import _normalize_datetime_for_sorting # Test Case 1: None value assert _normalize_datetime_for_sorting(None) is None # Test Case 2: ISO format string with 'Z' suffix dt_str_z = "2024-01-15T10:30:00Z" result = _normalize_datetime_for_sorting(dt_str_z) assert result is not None assert isinstance(result, datetime) assert result.tzinfo == timezone.utc assert result.year == 2024 assert result.month == 1 assert result.day == 15 assert result.hour == 10 assert result.minute == 30 # Test Case 3: ISO format string without 'Z' suffix (naive) dt_str_naive = "2024-01-15T10:30:00" result = _normalize_datetime_for_sorting(dt_str_naive) assert result is not None assert isinstance(result, datetime) assert result.tzinfo == timezone.utc # Test Case 4: ISO format string with timezone offset dt_str_tz = "2024-01-15T10:30:00+05:00" result = _normalize_datetime_for_sorting(dt_str_tz) assert result is not None assert isinstance(result, datetime) assert result.tzinfo == timezone.utc # Should convert from +05:00 to UTC (subtract 5 hours) assert result.hour == 5 # 10:30 - 5 hours = 5:30 UTC # Test Case 5: Naive datetime object naive_dt = datetime(2024, 1, 15, 10, 30, 0) result = _normalize_datetime_for_sorting(naive_dt) assert result is not None assert isinstance(result, datetime) assert result.tzinfo == timezone.utc assert result.year == 2024 assert result.month == 1 assert result.day == 15 # Test Case 6: Timezone-aware datetime object (non-UTC) from datetime import timedelta aware_dt = datetime(2024, 1, 15, 10, 30, 0, tzinfo=timezone(timedelta(hours=5))) result = _normalize_datetime_for_sorting(aware_dt) assert result is not None assert isinstance(result, datetime) assert result.tzinfo == timezone.utc # Should convert from +05:00 to UTC assert result.hour == 5 # Test Case 7: UTC-aware datetime object utc_dt = datetime(2024, 1, 15, 10, 30, 0, tzinfo=timezone.utc) result = _normalize_datetime_for_sorting(utc_dt) assert result is not None assert isinstance(result, datetime) assert result.tzinfo == timezone.utc assert result == utc_dt # Test Case 8: Invalid string format invalid_str = "not-a-date" result = _normalize_datetime_for_sorting(invalid_str) assert result is None # Test Case 9: Invalid type (should return None) result = _normalize_datetime_for_sorting(12345) assert result is None @pytest.mark.asyncio async def test_add_proxy_budget_to_db_only_creates_user_no_keys(): """ Test that _add_proxy_budget_to_db only creates a user and no keys are added. This validates that generate_key_helper_fn is called with table_name="user" which should prevent key creation in LiteLLM_VerificationToken table. """ from unittest.mock import AsyncMock, patch import litellm from litellm.proxy.proxy_server import ProxyStartupEvent # Set up required litellm settings litellm.budget_duration = "30d" litellm.max_budget = 100.0 litellm_proxy_budget_name = "litellm-proxy-budget" # Mock generate_key_helper_fn to capture its call arguments mock_generate_key_helper = AsyncMock( return_value={ "user_id": litellm_proxy_budget_name, "max_budget": 100.0, "budget_duration": "30d", "spend": 0, "models": [], } ) # Patch generate_key_helper_fn in proxy_server where it's being called from with patch( "litellm.proxy.proxy_server.generate_key_helper_fn", mock_generate_key_helper ): # Call the function under test ProxyStartupEvent._add_proxy_budget_to_db(litellm_proxy_budget_name) # Allow async task to complete import asyncio await asyncio.sleep(0.1) # Verify that generate_key_helper_fn was called mock_generate_key_helper.assert_called_once() call_args = mock_generate_key_helper.call_args # Verify critical parameters that prevent key creation assert call_args.kwargs["request_type"] == "user" assert call_args.kwargs["table_name"] == "user" assert call_args.kwargs["user_id"] == litellm_proxy_budget_name assert call_args.kwargs["max_budget"] == 100.0 assert call_args.kwargs["budget_duration"] == "30d" assert call_args.kwargs["query_type"] == "update_data" @pytest.mark.asyncio async def test_custom_ui_sso_sign_in_handler_config_loading(): """ Test that custom_ui_sso_sign_in_handler from config gets properly loaded into the global variable """ import tempfile from unittest.mock import MagicMock, patch import yaml from litellm.proxy.proxy_server import ProxyConfig # Create a test config with custom_ui_sso_sign_in_handler test_config = { "general_settings": { "custom_ui_sso_sign_in_handler": "custom_hooks.custom_ui_sso_hook.custom_ui_sso_sign_in_handler" }, "model_list": [], "router_settings": {}, "litellm_settings": {}, } # Create temporary config file with tempfile.NamedTemporaryFile(mode="w", suffix=".yaml", delete=False) as f: yaml.dump(test_config, f) config_file_path = f.name # Mock the get_instance_fn to return a mock handler mock_custom_handler = MagicMock() try: with patch( "litellm.proxy.proxy_server.get_instance_fn", return_value=mock_custom_handler, ) as mock_get_instance: # Create ProxyConfig instance and load config proxy_config = ProxyConfig() # Create a mock router since load_config requires it mock_router = MagicMock() await proxy_config.load_config( router=mock_router, config_file_path=config_file_path ) # Verify get_instance_fn was called with correct parameters mock_get_instance.assert_called_with( value="custom_hooks.custom_ui_sso_hook.custom_ui_sso_sign_in_handler", config_file_path=config_file_path, ) # Verify the global variable was set from litellm.proxy.proxy_server import user_custom_ui_sso_sign_in_handler assert user_custom_ui_sso_sign_in_handler == mock_custom_handler finally: # Clean up temporary file import os os.unlink(config_file_path) @pytest.mark.asyncio async def test_load_environment_variables_direct_and_os_environ(): """ Test _load_environment_variables method with direct values and os.environ/ prefixed values """ from unittest.mock import patch from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() # Test config with both direct values and os.environ/ prefixed values test_config = { "environment_variables": { "DIRECT_VAR": "direct_value", "NUMERIC_VAR": 12345, "BOOL_VAR": True, "SECRET_VAR": "os.environ/ACTUAL_SECRET_VAR", } } # Mock get_secret_str to return a resolved value mock_secret_value = "resolved_secret_value" with patch( "litellm.proxy.proxy_server.get_secret_str", return_value=mock_secret_value ) as mock_get_secret: with patch.dict( os.environ, {}, clear=False ): # Don't clear existing env vars, just track changes # Call the method under test proxy_config._load_environment_variables(test_config) # Verify direct environment variables were set correctly assert os.environ["DIRECT_VAR"] == "direct_value" assert os.environ["NUMERIC_VAR"] == "12345" # Should be converted to string assert os.environ["BOOL_VAR"] == "True" # Should be converted to string # Verify os.environ/ prefixed variable was resolved and set assert os.environ["SECRET_VAR"] == mock_secret_value # Verify get_secret_str was called with the correct value mock_get_secret.assert_called_once_with( secret_name="os.environ/ACTUAL_SECRET_VAR" ) @pytest.mark.asyncio async def test_load_environment_variables_litellm_license_and_edge_cases(): """ Test _load_environment_variables method with LITELLM_LICENSE special handling and edge cases """ from unittest.mock import MagicMock, patch from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() # Test Case 1: LITELLM_LICENSE in environment_variables test_config_with_license = { "environment_variables": { "LITELLM_LICENSE": "test_license_key", "OTHER_VAR": "other_value", } } # Mock _license_check mock_license_check = MagicMock() mock_license_check.is_premium.return_value = True with patch("litellm.proxy.proxy_server._license_check", mock_license_check): with patch.dict(os.environ, {}, clear=False): # Call the method under test proxy_config._load_environment_variables(test_config_with_license) # Verify LITELLM_LICENSE was set in environment assert os.environ["LITELLM_LICENSE"] == "test_license_key" # Verify license check was updated assert mock_license_check.license_str == "test_license_key" mock_license_check.is_premium.assert_called_once() # Test Case 2: No environment_variables in config test_config_no_env_vars = {} # This should not raise any errors and should return without doing anything result = proxy_config._load_environment_variables(test_config_no_env_vars) assert result is None # Method returns None # Test Case 3: environment_variables is None test_config_none_env_vars = {"environment_variables": None} # This should not raise any errors and should return without doing anything result = proxy_config._load_environment_variables(test_config_none_env_vars) assert result is None # Method returns None # Test Case 4: os.environ/ prefix but get_secret_str returns None test_config_secret_none = { "environment_variables": {"FAILED_SECRET": "os.environ/NONEXISTENT_SECRET"} } with patch("litellm.proxy.proxy_server.get_secret_str", return_value=None): with patch.dict(os.environ, {}, clear=False): # Call the method under test proxy_config._load_environment_variables(test_config_secret_none) # Verify that the environment variable was not set when secret resolution fails assert "FAILED_SECRET" not in os.environ @pytest.mark.asyncio async def test_write_config_to_file(monkeypatch): """ Do not write config to file if store_model_in_db is True """ from unittest.mock import AsyncMock, MagicMock, mock_open, patch from litellm.proxy.proxy_server import ProxyConfig # Set store_model_in_db to True monkeypatch.setattr("litellm.proxy.proxy_server.store_model_in_db", True) # Mock prisma_client to not be None (so DB path is taken) mock_prisma_client = AsyncMock() mock_prisma_client.insert_data = AsyncMock() monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", mock_prisma_client) # Mock general_settings mock_general_settings = {"store_model_in_db": True} monkeypatch.setattr( "litellm.proxy.proxy_server.general_settings", mock_general_settings ) # Mock user_config_file_path test_config_path = "/tmp/test_config.yaml" monkeypatch.setattr( "litellm.proxy.proxy_server.user_config_file_path", test_config_path ) proxy_config = ProxyConfig() # Mock the open function to track if file writing is attempted mock_file_open = mock_open() with patch("builtins.open", mock_file_open), patch("yaml.dump") as mock_yaml_dump: # Call save_config with test data test_config = {"key": "value", "model_list": ["model1", "model2"]} await proxy_config.save_config(new_config=test_config) # Verify that file was NOT opened for writing (since store_model_in_db=True) mock_file_open.assert_not_called() mock_yaml_dump.assert_not_called() # Verify that database insert was called instead mock_prisma_client.insert_data.assert_called_once() # Verify the config passed to DB has model_list removed call_args = mock_prisma_client.insert_data.call_args assert call_args.kwargs["data"] == { "key": "value" } # model_list should be popped assert call_args.kwargs["table_name"] == "config" @pytest.mark.asyncio async def test_write_config_to_file_when_store_model_in_db_false(monkeypatch): """ Test that config IS written to file when store_model_in_db is False """ from unittest.mock import AsyncMock, MagicMock, mock_open, patch from litellm.proxy.proxy_server import ProxyConfig # Set store_model_in_db to False monkeypatch.setattr("litellm.proxy.proxy_server.store_model_in_db", False) # Mock prisma_client to be None (so file path is taken) monkeypatch.setattr("litellm.proxy.proxy_server.prisma_client", None) # Mock general_settings mock_general_settings = {"store_model_in_db": False} monkeypatch.setattr( "litellm.proxy.proxy_server.general_settings", mock_general_settings ) # Mock user_config_file_path test_config_path = "/tmp/test_config.yaml" monkeypatch.setattr( "litellm.proxy.proxy_server.user_config_file_path", test_config_path ) proxy_config = ProxyConfig() # Mock the open function and yaml.dump mock_file_open = mock_open() with patch("builtins.open", mock_file_open), patch("yaml.dump") as mock_yaml_dump: # Call save_config with test data test_config = {"key": "value", "other_key": "other_value"} await proxy_config.save_config(new_config=test_config) # Verify that file WAS opened for writing (since store_model_in_db=False) mock_file_open.assert_called_once_with(f"{test_config_path}", "w") # Verify yaml.dump was called with the config mock_yaml_dump.assert_called_once_with( test_config, mock_file_open.return_value.__enter__.return_value, default_flow_style=False, ) @pytest.mark.asyncio async def test_async_data_generator_midstream_error(): """ Test async_data_generator handles midstream error from async_post_call_streaming_hook Specifically testing the case where Azure Content Safety Guardrail returns an error """ from litellm.proxy._types import UserAPIKeyAuth from litellm.proxy.proxy_server import async_data_generator from litellm.proxy.utils import ProxyLogging # Create mock objects mock_user_api_key_dict = MagicMock(spec=UserAPIKeyAuth) mock_request_data = { "model": "gpt-3.5-turbo", "messages": [{"role": "user", "content": "test"}], } # Mock response chunks - simulating normal streaming that gets interrupted mock_chunks = [ {"choices": [{"delta": {"content": "Hello"}}]}, {"choices": [{"delta": {"content": " world"}}]}, {"choices": [{"delta": {"content": " this"}}]}, ] # Mock the proxy_logging_obj mock_proxy_logging_obj = MagicMock(spec=ProxyLogging) # Mock async_post_call_streaming_iterator_hook to yield chunks async def mock_streaming_iterator(*args, **kwargs): for chunk in mock_chunks: yield chunk mock_proxy_logging_obj.async_post_call_streaming_iterator_hook = ( mock_streaming_iterator ) # Mock async_post_call_streaming_hook to return error on third chunk def mock_streaming_hook(*args, **kwargs): chunk = kwargs.get("response") # Return error message for the third chunk (simulating guardrail trigger) if chunk == mock_chunks[2]: return 'data: {"error": {"error": "Azure Content Safety Guardrail: Hate crossed severity 2, Got severity: 2"}}' # Return normal chunks for first two return chunk mock_proxy_logging_obj.async_post_call_streaming_hook = AsyncMock( side_effect=mock_streaming_hook ) mock_proxy_logging_obj.post_call_failure_hook = AsyncMock() # Mock the global proxy_logging_obj with patch("litellm.proxy.proxy_server.proxy_logging_obj", mock_proxy_logging_obj): # Create a mock response object mock_response = MagicMock() # Collect all yielded data from the generator yielded_data = [] try: async for data in async_data_generator( mock_response, mock_user_api_key_dict, mock_request_data ): yielded_data.append(data) except Exception as e: # If there's an exception, that's also part of what we want to test pass # Verify the results assert ( len(yielded_data) >= 3 ), f"Expected at least 3 chunks, got {len(yielded_data)}: {yielded_data}" # First two chunks should be normal data assert yielded_data[0].startswith( "data: " ), f"First chunk should start with 'data: ', got: {yielded_data[0]}" assert yielded_data[1].startswith( "data: " ), f"Second chunk should start with 'data: ', got: {yielded_data[1]}" # The error message should be yielded error_found = False done_found = False for data in yielded_data: if "Azure Content Safety Guardrail: Hate crossed severity 2" in data: error_found = True if "data: [DONE]" in data: done_found = True assert ( error_found ), f"Error message should be found in yielded data. Got: {yielded_data}" assert done_found, f"[DONE] message should be found at the end. Got: {yielded_data}" # Verify that the streaming hook was called for each chunk assert mock_proxy_logging_obj.async_post_call_streaming_hook.call_count == len( mock_chunks ) # Verify that post_call_failure_hook was NOT called (since this is not an exception case) mock_proxy_logging_obj.post_call_failure_hook.assert_not_called() def _has_nested_none_values(obj, path="root"): """ Recursively check if an object contains nested None values. Args: obj: The object to check path: Current path in the object tree (for debugging) Returns: List of paths where None values were found """ none_paths = [] if obj is None: none_paths.append(path) elif isinstance(obj, dict): for key, value in obj.items(): none_paths.extend(_has_nested_none_values(value, f"{path}.{key}")) elif isinstance(obj, (list, tuple)): for i, item in enumerate(obj): none_paths.extend(_has_nested_none_values(item, f"{path}[{i}]")) elif hasattr(obj, "__dict__"): # Handle object attributes for key, value in obj.__dict__.items(): if not key.startswith("_"): # Skip private attributes none_paths.extend(_has_nested_none_values(value, f"{path}.{key}")) return none_paths @pytest.mark.asyncio async def test_chat_completion_result_no_nested_none_values(): """ Test that chat_completion result doesn't have nested None values when using exclude_none=True """ from unittest.mock import AsyncMock, MagicMock, patch from fastapi import Request, Response from pydantic import BaseModel import litellm from litellm.proxy._types import UserAPIKeyAuth from litellm.proxy.proxy_server import chat_completion # Create a mock ModelResponse with nested None values mock_model_response = litellm.ModelResponse() mock_model_response.id = "test-id" mock_model_response.model = "gpt-3.5-turbo" mock_model_response.object = "chat.completion" mock_model_response.created = 1234567890 # Create message with None values that should be excluded mock_message = litellm.Message( content="Hello, world!", role="assistant", function_call=None, # This should be excluded tool_calls=None, # This should be excluded audio=None, # This should be excluded reasoning_content=None, # This should be excluded thinking_blocks=None, # This should be excluded annotations=None, # This should be excluded ) # Create choice with potential None values mock_choice = litellm.Choices( finish_reason="stop", index=0, message=mock_message, logprobs=None, # This should be excluded when exclude_none=True ) mock_model_response.choices = [mock_choice] setattr( mock_model_response, "usage", litellm.Usage(prompt_tokens=10, completion_tokens=5, total_tokens=15), ) # Verify the mock has None values before serialization raw_dict = mock_model_response.model_dump() none_paths_before = _has_nested_none_values(raw_dict) assert ( len(none_paths_before) > 0 ), "Mock should have None values before exclude_none=True" # Mock the request processing to return our mock response mock_base_processor = MagicMock() mock_base_processor.base_process_llm_request = AsyncMock( return_value=mock_model_response ) # Mock other dependencies mock_request = MagicMock(spec=Request) mock_response = MagicMock(spec=Response) mock_user_api_key_dict = MagicMock(spec=UserAPIKeyAuth) with patch( "litellm.proxy.proxy_server._read_request_body", return_value={"model": "gpt-3.5-turbo", "messages": []}, ), patch( "litellm.proxy.proxy_server.ProxyBaseLLMRequestProcessing", return_value=mock_base_processor, ): # Call the chat_completion function result = await chat_completion( request=mock_request, fastapi_response=mock_response, user_api_key_dict=mock_user_api_key_dict, ) # Verify the result is a dict (since isinstance(result, BaseModel) was True) assert isinstance(result, dict), f"Expected dict result, got {type(result)}" # Check that there are no nested None values in the result none_paths_after = _has_nested_none_values(result) assert ( len(none_paths_after) == 0 ), f"Result should not contain nested None values. Found None at: {none_paths_after}" # Verify essential fields are present assert "id" in result assert "model" in result assert "object" in result assert "created" in result assert "choices" in result assert "usage" in result # Verify that the choices contain the expected message content assert len(result["choices"]) == 1 assert result["choices"][0]["message"]["content"] == "Hello, world!" assert result["choices"][0]["message"]["role"] == "assistant" # Verify that None fields were excluded (should not be present in the dict) message = result["choices"][0]["message"] excluded_fields = [ "function_call", "tool_calls", "audio", "reasoning_content", "thinking_blocks", "annotations", ] for field in excluded_fields: assert ( field not in message ), f"Field '{field}' should be excluded when it's None" # ============================================================================ # Price Data Reload Tests # ============================================================================ class TestPriceDataReloadAPI: """Test cases for price data reload API endpoints""" @pytest.fixture def client_with_auth(self): """Create a test client with authentication""" from litellm.proxy._types import LitellmUserRoles from litellm.proxy.proxy_server import cleanup_router_config_variables cleanup_router_config_variables() filepath = os.path.dirname(os.path.abspath(__file__)) config_fp = f"{filepath}/test_configs/test_config_no_auth.yaml" asyncio.run(initialize(config=config_fp, debug=True)) # Mock admin user authentication mock_auth = MagicMock() mock_auth.user_role = LitellmUserRoles.PROXY_ADMIN app.dependency_overrides[user_api_key_auth] = lambda: mock_auth return TestClient(app) def test_reload_model_cost_map_admin_access(self, client_with_auth): """Test that admin users can access the reload endpoint""" # Save the original model_cost so the endpoint's direct assignment # (litellm.model_cost = new_model_cost_map) does not contaminate # subsequent tests running in the same worker process. original_model_cost = litellm.model_cost.copy() try: with patch( "litellm.litellm_core_utils.get_model_cost_map.get_model_cost_map" ) as mock_get_map: mock_get_map.return_value = { "gpt-3.5-turbo": {"input_cost_per_token": 0.001} } # Mock the database connection with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma: mock_prisma.db.litellm_config.find_unique = AsyncMock( return_value=None ) mock_prisma.db.litellm_config.upsert = AsyncMock(return_value=None) response = client_with_auth.post("/reload/model_cost_map") assert response.status_code == 200 data = response.json() assert data["status"] == "success" assert "message" in data assert "timestamp" in data assert "models_count" in data # The new implementation immediately reloads and returns the count assert ( "Price data reloaded successfully! 1 models updated." in data["message"] ) assert data["models_count"] == 1 finally: # Restore the full model cost map so subsequent tests are not affected litellm.model_cost = original_model_cost _invalidate_model_cost_lowercase_map() def test_reload_model_cost_map_non_admin_access(self, client_with_auth): """Test that non-admin users cannot access the reload endpoint""" # Mock non-admin user mock_auth = MagicMock() mock_auth.user_role = "user" # Non-admin role app.dependency_overrides[user_api_key_auth] = lambda: mock_auth response = client_with_auth.post("/reload/model_cost_map") assert response.status_code == 403 data = response.json() assert "Access denied" in data["detail"] assert "Admin role required" in data["detail"] def test_get_model_cost_map_public_access(self, client_no_auth): """Test that the model cost map endpoint is publicly accessible""" with patch( "litellm.model_cost", {"gpt-3.5-turbo": {"input_cost_per_token": 0.001}} ): response = client_no_auth.get("/public/litellm_model_cost_map") assert response.status_code == 200 data = response.json() assert "gpt-3.5-turbo" in data def test_reload_model_cost_map_error_handling(self, client_with_auth): """Test error handling in the reload endpoint""" with patch( "litellm.litellm_core_utils.get_model_cost_map.get_model_cost_map" ) as mock_get_map: mock_get_map.side_effect = Exception("Network error") # Mock the database connection with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma: mock_prisma.db.litellm_config.find_unique = AsyncMock( return_value=None ) mock_prisma.db.litellm_config.upsert = AsyncMock(return_value=None) response = client_with_auth.post("/reload/model_cost_map") assert ( response.status_code == 500 ) # The new implementation immediately reloads and fails on error data = response.json() assert "Failed to reload model cost map" in data["detail"] def test_schedule_model_cost_map_reload_admin_access(self, client_with_auth): """Test that admin users can schedule periodic reload""" with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma: # Mock database upsert mock_prisma.db.litellm_config.upsert = AsyncMock(return_value=None) response = client_with_auth.post("/schedule/model_cost_map_reload?hours=6") assert response.status_code == 200 data = response.json() assert data["status"] == "success" assert data["interval_hours"] == 6 assert "message" in data assert "timestamp" in data def test_schedule_model_cost_map_reload_non_admin_access(self, client_with_auth): """Test that non-admin users cannot schedule periodic reload""" # Mock non-admin user mock_auth = MagicMock() mock_auth.user_role = "user" # Non-admin role app.dependency_overrides[user_api_key_auth] = lambda: mock_auth response = client_with_auth.post("/schedule/model_cost_map_reload?hours=6") assert response.status_code == 403 data = response.json() assert "Access denied" in data["detail"] assert "Admin role required" in data["detail"] def test_schedule_model_cost_map_reload_invalid_hours(self, client_with_auth): """Test that invalid hours parameter is rejected""" response = client_with_auth.post("/schedule/model_cost_map_reload?hours=0") assert response.status_code == 400 data = response.json() assert "Hours must be greater than 0" in data["detail"] def test_cancel_model_cost_map_reload_admin_access(self, client_with_auth): """Test that admin users can cancel periodic reload""" with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma: # Mock database delete mock_prisma.db.litellm_config.delete = AsyncMock(return_value=None) response = client_with_auth.delete("/schedule/model_cost_map_reload") assert response.status_code == 200 data = response.json() assert data["status"] == "success" assert "message" in data assert "timestamp" in data def test_cancel_model_cost_map_reload_non_admin_access(self, client_with_auth): """Test that non-admin users cannot cancel periodic reload""" # Mock non-admin user mock_auth = MagicMock() mock_auth.user_role = "user" # Non-admin role app.dependency_overrides[user_api_key_auth] = lambda: mock_auth response = client_with_auth.delete("/schedule/model_cost_map_reload") assert response.status_code == 403 data = response.json() assert "Access denied" in data["detail"] assert "Admin role required" in data["detail"] def test_get_model_cost_map_reload_status_admin_access(self, client_with_auth): """Test that admin users can get reload status""" with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma: # Mock database config record mock_config = MagicMock() mock_config.param_value = {"interval_hours": 6, "force_reload": False} mock_prisma.db.litellm_config.find_unique = AsyncMock( return_value=mock_config ) # Mock the last reload time and current time with patch( "litellm.proxy.proxy_server.last_model_cost_map_reload", "2024-01-01T06:00:00", ): with patch("litellm.proxy.proxy_server.datetime") as mock_datetime: # Mock current time to be 1 hour after last reload mock_datetime.utcnow.return_value = datetime(2024, 1, 1, 7, 0, 0) mock_datetime.fromisoformat = datetime.fromisoformat response = client_with_auth.get( "/schedule/model_cost_map_reload/status" ) assert response.status_code == 200 data = response.json() assert data["scheduled"] == True assert data["interval_hours"] == 6 assert data["last_run"] == "2024-01-01T06:00:00" assert data["next_run"] == "2024-01-01T12:00:00" def test_get_model_cost_map_reload_status_non_admin_access(self, client_with_auth): """Test that non-admin users cannot get reload status""" # Mock non-admin user mock_auth = MagicMock() mock_auth.user_role = "user" # Non-admin role app.dependency_overrides[user_api_key_auth] = lambda: mock_auth response = client_with_auth.get("/schedule/model_cost_map_reload/status") assert response.status_code == 403 data = response.json() assert "Access denied" in data["detail"] assert "Admin role required" in data["detail"] def test_get_model_cost_map_reload_status_no_config(self, client_with_auth): """Test that status returns not scheduled when no config exists""" with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma: mock_prisma.db.litellm_config.find_unique = AsyncMock(return_value=None) response = client_with_auth.get("/schedule/model_cost_map_reload/status") assert response.status_code == 200 data = response.json() assert data["scheduled"] == False assert data["interval_hours"] == None assert data["last_run"] == None assert data["next_run"] == None def test_get_model_cost_map_reload_status_no_interval(self, client_with_auth): """Test that status returns not scheduled when no interval is configured""" with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma: # Mock config with no interval mock_config = MagicMock() mock_config.param_value = {"interval_hours": None, "force_reload": False} mock_prisma.db.litellm_config.find_unique = AsyncMock( return_value=mock_config ) response = client_with_auth.get("/schedule/model_cost_map_reload/status") assert response.status_code == 200 data = response.json() assert data["scheduled"] == False assert data["interval_hours"] == None assert data["last_run"] == None assert data["next_run"] == None class TestPriceDataReloadIntegration: """Integration tests for the complete price data reload feature""" @pytest.fixture def client_with_auth(self): """Create a test client with authentication""" from litellm.proxy._types import LitellmUserRoles from litellm.proxy.proxy_server import cleanup_router_config_variables cleanup_router_config_variables() filepath = os.path.dirname(os.path.abspath(__file__)) config_fp = f"{filepath}/test_configs/test_config_no_auth.yaml" asyncio.run(initialize(config=config_fp, debug=True)) # Mock admin user authentication mock_auth = MagicMock() mock_auth.user_role = LitellmUserRoles.PROXY_ADMIN app.dependency_overrides[user_api_key_auth] = lambda: mock_auth return TestClient(app) def test_complete_reload_flow(self, client_with_auth): """Test the complete reload flow from API to model cost update""" # Mock the model cost map mock_cost_map = { "gpt-3.5-turbo": { "input_cost_per_token": 0.001, "output_cost_per_token": 0.002, }, "gpt-4": {"input_cost_per_token": 0.03, "output_cost_per_token": 0.06}, } original_model_cost = litellm.model_cost.copy() try: with patch( "litellm.litellm_core_utils.get_model_cost_map.get_model_cost_map" ) as mock_get_map: mock_get_map.return_value = mock_cost_map # Mock the database connection with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma: mock_prisma.db.litellm_config.find_unique = AsyncMock( return_value=None ) mock_prisma.db.litellm_config.upsert = AsyncMock(return_value=None) # Test reload endpoint response = client_with_auth.post("/reload/model_cost_map") assert response.status_code == 200 # Test get endpoint response = client_with_auth.get("/public/litellm_model_cost_map") assert response.status_code == 200 finally: litellm.model_cost = original_model_cost _invalidate_model_cost_lowercase_map() def test_distributed_reload_check_function(self): """Test the _check_and_reload_model_cost_map function""" from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() # Mock prisma client mock_prisma = MagicMock() # Test case 1: No config in database mock_prisma.db.litellm_config.find_unique = AsyncMock(return_value=None) # Should return early without reloading asyncio.run(proxy_config._check_and_reload_model_cost_map(mock_prisma)) # Test case 2: Config with interval but not time to reload mock_config = MagicMock() mock_config.param_value = {"interval_hours": 6, "force_reload": False} mock_prisma.db.litellm_config.find_unique = AsyncMock(return_value=mock_config) # Mock current time and last reload time with patch( "litellm.proxy.proxy_server.last_model_cost_map_reload", "2024-01-01T06:00:00", ): with patch("litellm.proxy.proxy_server.datetime") as mock_datetime: mock_datetime.utcnow.return_value = datetime( 2024, 1, 1, 7, 0, 0 ) # 1 hour later # Should not reload (only 1 hour passed, need 6) asyncio.run(proxy_config._check_and_reload_model_cost_map(mock_prisma)) # Test case 3: Config with force reload mock_config.param_value = {"interval_hours": 6, "force_reload": True} mock_prisma.db.litellm_config.find_unique = AsyncMock(return_value=mock_config) mock_prisma.db.litellm_config.upsert = AsyncMock(return_value=None) original_model_cost = litellm.model_cost.copy() try: with patch( "litellm.litellm_core_utils.get_model_cost_map.get_model_cost_map" ) as mock_get_map: mock_get_map.return_value = { "gpt-3.5-turbo": {"input_cost_per_token": 0.001} } # Should reload due to force flag asyncio.run(proxy_config._check_and_reload_model_cost_map(mock_prisma)) # Verify force_reload was reset to False mock_prisma.db.litellm_config.upsert.assert_called() call_args = mock_prisma.db.litellm_config.upsert.call_args # The param_value is now a JSON string, so we need to parse it param_value_json = call_args[1]["data"]["update"]["param_value"] param_value_dict = json.loads(param_value_json) assert param_value_dict["force_reload"] == False assert param_value_dict.get("interval_hours") == 6 finally: litellm.model_cost = original_model_cost _invalidate_model_cost_lowercase_map() def test_distributed_reload_preserves_interval_hours(self): """Test that _check_and_reload_model_cost_map preserves interval_hours after reload. Regression test: the update branch of the upsert was previously dropping interval_hours, causing scheduled reloads to self-destruct after first execution. """ from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() mock_prisma = MagicMock() # Set up config with interval_hours=24 and force_reload=True to trigger reload mock_config = MagicMock() mock_config.param_value = {"interval_hours": 24, "force_reload": True} mock_prisma.db.litellm_config.find_unique = AsyncMock(return_value=mock_config) mock_prisma.db.litellm_config.upsert = AsyncMock(return_value=None) original_model_cost = litellm.model_cost.copy() try: with patch( "litellm.litellm_core_utils.get_model_cost_map.get_model_cost_map" ) as mock_get_map: mock_get_map.return_value = {"gpt-4": {"input_cost_per_token": 0.001}} asyncio.run(proxy_config._check_and_reload_model_cost_map(mock_prisma)) # Verify the upsert update branch preserves interval_hours mock_prisma.db.litellm_config.upsert.assert_called() call_args = mock_prisma.db.litellm_config.upsert.call_args param_value_json = call_args[1]["data"]["update"]["param_value"] param_value_dict = json.loads(param_value_json) assert param_value_dict["force_reload"] == False assert param_value_dict["interval_hours"] == 24, ( "interval_hours must be preserved in the update branch; " "dropping it causes the schedule to self-destruct" ) finally: litellm.model_cost = original_model_cost _invalidate_model_cost_lowercase_map() def test_manual_reload_preserves_interval_hours(self): """Test that manual reload via /reload/model_cost_map preserves existing interval_hours. Regression test: the manual reload endpoint was overwriting param_value with only force_reload=True, dropping any existing interval_hours schedule. """ from litellm.proxy._types import LitellmUserRoles from litellm.proxy.proxy_server import cleanup_router_config_variables cleanup_router_config_variables() filepath = os.path.dirname(os.path.abspath(__file__)) config_fp = f"{filepath}/test_configs/test_config_no_auth.yaml" asyncio.run(initialize(config=config_fp, debug=True)) mock_auth = MagicMock() mock_auth.user_role = LitellmUserRoles.PROXY_ADMIN app.dependency_overrides[user_api_key_auth] = lambda: mock_auth client = TestClient(app) original_model_cost = litellm.model_cost.copy() try: with patch( "litellm.litellm_core_utils.get_model_cost_map.get_model_cost_map" ) as mock_get_map: mock_get_map.return_value = {"gpt-4": {"input_cost_per_token": 0.001}} with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma: # Simulate existing config with a schedule mock_existing = MagicMock() mock_existing.param_value = {"interval_hours": 12, "force_reload": False} mock_prisma.db.litellm_config.find_unique = AsyncMock(return_value=mock_existing) mock_prisma.db.litellm_config.upsert = AsyncMock(return_value=None) response = client.post("/reload/model_cost_map") assert response.status_code == 200 # Verify interval_hours was preserved in the upsert mock_prisma.db.litellm_config.upsert.assert_called() call_args = mock_prisma.db.litellm_config.upsert.call_args param_value_json = call_args[1]["data"]["update"]["param_value"] param_value_dict = json.loads(param_value_json) assert param_value_dict["force_reload"] == True assert param_value_dict["interval_hours"] == 12, ( "interval_hours must be preserved when manual reload sets force_reload; " "dropping it destroys any existing schedule" ) finally: litellm.model_cost = original_model_cost _invalidate_model_cost_lowercase_map() def test_anthropic_beta_headers_reload_preserves_interval_hours(self): """Test that _check_and_reload_anthropic_beta_headers preserves interval_hours after reload. Regression test: the update branch of the upsert was dropping interval_hours, identical to the model cost map bug. """ from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() mock_prisma = MagicMock() # Set up config with interval_hours=12 and force_reload=True to trigger reload mock_config = MagicMock() mock_config.param_value = {"interval_hours": 12, "force_reload": True} mock_prisma.db.litellm_config.find_unique = AsyncMock(return_value=mock_config) mock_prisma.db.litellm_config.upsert = AsyncMock(return_value=None) with patch( "litellm.anthropic_beta_headers_manager.reload_beta_headers_config" ) as mock_reload: mock_reload.return_value = {"anthropic": {"beta_header": "test-value"}} asyncio.run(proxy_config._check_and_reload_anthropic_beta_headers(mock_prisma)) # Verify the upsert update branch preserves interval_hours mock_prisma.db.litellm_config.upsert.assert_called() call_args = mock_prisma.db.litellm_config.upsert.call_args param_value_json = call_args[1]["data"]["update"]["param_value"] param_value_dict = json.loads(param_value_json) assert param_value_dict["force_reload"] == False assert param_value_dict["interval_hours"] == 12, ( "interval_hours must be preserved in the update branch; " "dropping it causes the schedule to self-destruct" ) def test_anthropic_beta_headers_manual_reload_preserves_interval_hours(self): """Test that manual reload via /reload/anthropic_beta_headers preserves existing interval_hours. Regression test: the manual reload endpoint was overwriting param_value with only force_reload=True, dropping any existing interval_hours schedule. """ from litellm.proxy._types import LitellmUserRoles from litellm.proxy.proxy_server import cleanup_router_config_variables cleanup_router_config_variables() filepath = os.path.dirname(os.path.abspath(__file__)) config_fp = f"{filepath}/test_configs/test_config_no_auth.yaml" asyncio.run(initialize(config=config_fp, debug=True)) mock_auth = MagicMock() mock_auth.user_role = LitellmUserRoles.PROXY_ADMIN app.dependency_overrides[user_api_key_auth] = lambda: mock_auth client = TestClient(app) with patch( "litellm.anthropic_beta_headers_manager.reload_beta_headers_config" ) as mock_reload: mock_reload.return_value = {"anthropic": {"beta_header": "test-value"}} with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma: # Simulate existing config with a schedule mock_existing = MagicMock() mock_existing.param_value = {"interval_hours": 8, "force_reload": False} mock_prisma.db.litellm_config.find_unique = AsyncMock(return_value=mock_existing) mock_prisma.db.litellm_config.upsert = AsyncMock(return_value=None) response = client.post("/reload/anthropic_beta_headers") assert response.status_code == 200 # Verify interval_hours was preserved in the upsert mock_prisma.db.litellm_config.upsert.assert_called() call_args = mock_prisma.db.litellm_config.upsert.call_args param_value_json = call_args[1]["data"]["update"]["param_value"] param_value_dict = json.loads(param_value_json) assert param_value_dict["force_reload"] == True assert param_value_dict["interval_hours"] == 8, ( "interval_hours must be preserved when manual reload sets force_reload; " "dropping it destroys any existing schedule" ) def test_config_file_parsing(self): """Test parsing of config file with reload settings""" config_content = """ general_settings: master_key: sk-1234 model_cost_map_reload_interval: 21600 model_list: - model_name: gpt-3.5-turbo litellm_params: model: gpt-3.5-turbo - model_name: gpt-4 litellm_params: model: gpt-4 """ # Parse the config config = yaml.safe_load(config_content) # Verify the reload setting is present assert "general_settings" in config assert "model_cost_map_reload_interval" in config["general_settings"] assert config["general_settings"]["model_cost_map_reload_interval"] == 21600 # Verify models are present assert "model_list" in config assert len(config["model_list"]) == 2 def test_database_config_storage(self): """Test that configuration is properly stored in database""" # Mock prisma client mock_prisma = MagicMock() # Test the database upsert call that would be made by the schedule endpoint mock_prisma.db.litellm_config.upsert = AsyncMock(return_value=None) # Simulate the database call that the schedule endpoint would make asyncio.run( mock_prisma.db.litellm_config.upsert( where={"param_name": "model_cost_map_reload_config"}, data={ "create": { "param_name": "model_cost_map_reload_config", "param_value": {"interval_hours": 6, "force_reload": False}, }, "update": { "param_value": {"interval_hours": 6, "force_reload": False} }, }, ) ) # Verify database upsert was called with correct data mock_prisma.db.litellm_config.upsert.assert_called_once() call_args = mock_prisma.db.litellm_config.upsert.call_args assert call_args[1]["where"]["param_name"] == "model_cost_map_reload_config" assert call_args[1]["data"]["create"]["param_value"]["interval_hours"] == 6 assert call_args[1]["data"]["create"]["param_value"]["force_reload"] == False def test_manual_reload_force_flag(self): """Test that manual reload sets force flag correctly""" # Mock prisma client mock_prisma = MagicMock() # Test the database upsert call that would be made by the manual reload endpoint mock_prisma.db.litellm_config.upsert = AsyncMock(return_value=None) # Simulate the database call that the manual reload endpoint would make asyncio.run( mock_prisma.db.litellm_config.upsert( where={"param_name": "model_cost_map_reload_config"}, data={ "create": { "param_name": "model_cost_map_reload_config", "param_value": {"interval_hours": None, "force_reload": True}, }, "update": {"param_value": {"force_reload": True}}, }, ) ) # Verify force_reload flag was set mock_prisma.db.litellm_config.upsert.assert_called_once() call_args = mock_prisma.db.litellm_config.upsert.call_args assert call_args[1]["data"]["update"]["param_value"]["force_reload"] == True @pytest.mark.asyncio async def test_add_router_settings_from_db_config_merge_logic(): """ Test the _add_router_settings_from_db_config method's merge logic. This tests how router settings from config file and database are combined, including scenarios where nested dictionaries should be properly merged. """ from unittest.mock import AsyncMock, MagicMock, patch from litellm.proxy.proxy_server import ProxyConfig # Create ProxyConfig instance proxy_config = ProxyConfig() # Mock router mock_router = MagicMock() mock_router.update_settings = MagicMock() # Test Case 1: Both config and DB settings exist - should merge them config_data = { "router_settings": { "routing_strategy": "usage-based-routing", "model_group_alias": {"gpt-4": "openai-gpt-4"}, "enable_pre_call_checks": True, "timeout": 30, "nested_config": {"setting1": "config_value1", "setting2": "config_value2"}, } } # Mock database config record mock_db_config = MagicMock() mock_db_config.param_value = { "routing_strategy": "least-busy", # This should override config value "retry_delay": 2, # This is new, should be added "nested_config": { "setting2": "db_value2", # This should override config value "setting3": "db_value3", # This is new, should be added }, } # Mock prisma client mock_prisma_client = MagicMock() mock_prisma_client.db.litellm_config.find_first = AsyncMock( return_value=mock_db_config ) # Call the method under test await proxy_config._add_router_settings_from_db_config( config_data=config_data, llm_router=mock_router, prisma_client=mock_prisma_client, ) # Verify find_first was called with correct parameters mock_prisma_client.db.litellm_config.find_first.assert_called_once_with( where={"param_name": "router_settings"} ) # Verify update_settings was called mock_router.update_settings.assert_called_once() # Get the actual settings passed to update_settings call_args = mock_router.update_settings.call_args combined_settings = call_args[1] # kwargs # Verify the merge results # DB values should override config values assert combined_settings["routing_strategy"] == "least-busy" # Config-only values should be preserved assert combined_settings["model_group_alias"] == {"gpt-4": "openai-gpt-4"} assert combined_settings["enable_pre_call_checks"] == True assert combined_settings["timeout"] == 30 # DB-only values should be added assert combined_settings["retry_delay"] == 2 # Nested dictionaries should be merged (but this is shallow merge) expected_nested = { "setting1": "config_value1", "setting2": "db_value2", "setting3": "db_value3", } assert combined_settings["nested_config"] == expected_nested @pytest.mark.asyncio async def test_add_router_settings_from_db_config_edge_cases(): """ Test edge cases for _add_router_settings_from_db_config method. """ from unittest.mock import AsyncMock, MagicMock from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() mock_router = MagicMock() mock_router.update_settings = MagicMock() # Test Case 1: No router provided await proxy_config._add_router_settings_from_db_config( config_data={"router_settings": {"test": "value"}}, llm_router=None, prisma_client=MagicMock(), ) # Should not call anything when router is None mock_router.update_settings.assert_not_called() # Test Case 2: No prisma client provided await proxy_config._add_router_settings_from_db_config( config_data={"router_settings": {"test": "value"}}, llm_router=mock_router, prisma_client=None, ) # Should not call anything when prisma_client is None mock_router.update_settings.assert_not_called() # Test Case 3: DB returns None (no router_settings in DB) mock_prisma_client = MagicMock() mock_prisma_client.db.litellm_config.find_first = AsyncMock(return_value=None) config_data = {"router_settings": {"routing_strategy": "usage-based"}} await proxy_config._add_router_settings_from_db_config( config_data=config_data, llm_router=mock_router, prisma_client=mock_prisma_client, ) # Should use only config settings mock_router.update_settings.assert_called_once_with(routing_strategy="usage-based") mock_router.reset_mock() # Test Case 4: Config has no router_settings mock_db_config = MagicMock() mock_db_config.param_value = {"db_setting": "db_value"} mock_prisma_client.db.litellm_config.find_first = AsyncMock( return_value=mock_db_config ) await proxy_config._add_router_settings_from_db_config( config_data={}, # No router_settings in config llm_router=mock_router, prisma_client=mock_prisma_client, ) # Should use only DB settings mock_router.update_settings.assert_called_once_with(db_setting="db_value") mock_router.reset_mock() # Test Case 5: Both config and DB router_settings are None/empty mock_prisma_client.db.litellm_config.find_first = AsyncMock(return_value=None) await proxy_config._add_router_settings_from_db_config( config_data={}, llm_router=mock_router, prisma_client=mock_prisma_client ) # Should not call update_settings when no settings exist mock_router.update_settings.assert_not_called() # Test Case 6: DB config exists but param_value is not a dict mock_db_config_invalid = MagicMock() mock_db_config_invalid.param_value = "not_a_dict" mock_prisma_client.db.litellm_config.find_first = AsyncMock( return_value=mock_db_config_invalid ) config_data = {"router_settings": {"config_setting": "config_value"}} await proxy_config._add_router_settings_from_db_config( config_data=config_data, llm_router=mock_router, prisma_client=mock_prisma_client, ) # Should use only config settings when DB param_value is invalid mock_router.update_settings.assert_called_once_with(config_setting="config_value") @pytest.mark.asyncio async def test_add_router_settings_shallow_merge_behavior(): """ Test that the merge behavior is shallow (nested dicts get replaced, not merged). This documents the current behavior using _update_dictionary. """ from unittest.mock import AsyncMock, MagicMock from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() mock_router = MagicMock() mock_router.update_settings = MagicMock() # Config with nested dictionary config_data = { "router_settings": { "nested_setting": { "key1": "config_value1", "key2": "config_value2", "key3": "config_value3", }, "top_level": "config_top", } } # DB config that partially overlaps the nested dictionary mock_db_config = MagicMock() mock_db_config.param_value = { "nested_setting": { "key2": "db_value2", # Override existing key "key4": "db_value4", # Add new key # Note: key1 and key3 from config will be lost due to shallow merge }, "top_level": "db_top", # Override top level } mock_prisma_client = MagicMock() mock_prisma_client.db.litellm_config.find_first = AsyncMock( return_value=mock_db_config ) await proxy_config._add_router_settings_from_db_config( config_data=config_data, llm_router=mock_router, prisma_client=mock_prisma_client, ) # Get the merged settings call_args = mock_router.update_settings.call_args merged_settings = call_args[1] # Verify shallow merge behavior: # The entire nested_setting dict from config is replaced by the DB version expected_nested = { "key1": "config_value1", "key3": "config_value3", "key2": "db_value2", "key4": "db_value4", } assert merged_settings["nested_setting"] == expected_nested assert merged_settings["top_level"] == "db_top" @pytest.mark.asyncio async def test_model_info_v1_oci_secrets_not_leaked(): """ Test that model_info_v1 endpoint properly masks OCI sensitive parameters and does not leak secrets. """ from unittest.mock import MagicMock, patch from litellm.proxy._types import UserAPIKeyAuth from litellm.proxy.proxy_server import model_info_v1 # Mock user authentication mock_user_api_key_dict = MagicMock(spec=UserAPIKeyAuth) mock_user_api_key_dict.user_id = "test-user" mock_user_api_key_dict.api_key = "test-key" mock_user_api_key_dict.team_models = [] mock_user_api_key_dict.models = ["oci-grok-test"] # Mock model data with OCI sensitive information mock_model_data = { "model_name": "oci-grok-test", "litellm_params": { "model": "oci/xai.grok-4", "oci_key": "ocid1.api_key.oc1..aaaaaaaa7kbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbk", "oci_region": "us-phoenix-1", "oci_user": "ocid1.user.oc1..aaaaaaaa7kbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbk", "oci_fingerprint": "aa:bb:cc:dd:ee:ff:11:22:33:44:55:66:77:88:99:00", "oci_tenancy": "ocid1.tenancy.oc1..aaaaaaaa7kbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbk", "oci_key_file": "/path/to/oci_api_key.pem", "oci_compartment_id": "ocid1.compartment.oc1..aaaaaaaa7kbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbk", "drop_params": True }, "model_info": { "mode": "completion", "id": "test-model-id" } } # Mock the llm_router to return our test data mock_router = MagicMock() mock_router.get_model_names.return_value = ["oci-grok-test"] mock_router.get_model_access_groups.return_value = {} mock_router.get_model_list.return_value = [mock_model_data] # Mock global variables with patch("litellm.proxy.proxy_server.llm_router", mock_router), \ patch("litellm.proxy.proxy_server.llm_model_list", [mock_model_data]), \ patch("litellm.proxy.proxy_server.general_settings", {"infer_model_from_keys": False}), \ patch("litellm.proxy.proxy_server.user_model", None): # Call the model_info_v1 endpoint result = await model_info_v1( user_api_key_dict=mock_user_api_key_dict, litellm_model_id=None ) # Verify the result structure assert "data" in result assert len(result["data"]) == 1 model_info = result["data"][0] litellm_params = model_info["litellm_params"] # Verify that sensitive OCI fields are masked assert "****" in litellm_params["oci_key"], "oci_key should be masked" assert "****" in litellm_params["oci_fingerprint"], "oci_fingerprint should be masked" assert "****" in litellm_params["oci_tenancy"], "oci_tenancy should be masked" assert "****" in litellm_params["oci_key_file"], "oci_key_file should be masked" # Verify that non-sensitive fields are NOT masked assert litellm_params["model"] == "oci/xai.grok-4", "model field should not be masked" assert litellm_params["oci_region"] == "us-phoenix-1", "oci_region should not be masked" assert litellm_params["drop_params"] is True, "drop_params should not be masked" # Verify the model field specifically is not masked (this was the original issue) assert "****" not in litellm_params["model"], "model field should never be masked" assert litellm_params["model"].startswith("oci/"), "model should retain its full value" # Verify that actual secret values are not present in the response result_str = str(result) assert "ocid1.api_key.oc1..aaaaaaaa7kbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbk" not in result_str assert "aa:bb:cc:dd:ee:ff:11:22:33:44:55:66:77:88:99:00" not in result_str assert "ocid1.tenancy.oc1..aaaaaaaa7kbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbkbk" not in result_str assert "/path/to/oci_api_key.pem" not in result_str def test_add_callback_from_db_to_in_memory_litellm_callbacks(): """ Test that _add_callback_from_db_to_in_memory_litellm_callbacks correctly adds callbacks for success, failure, and combined event types. """ from unittest.mock import MagicMock, patch from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() # Mock the callback manager mock_callback_manager = MagicMock() with patch("litellm.proxy.proxy_server.litellm") as mock_litellm: # Set up mock litellm attributes mock_litellm._known_custom_logger_compatible_callbacks = [] mock_litellm.logging_callback_manager = mock_callback_manager # Test Case 1: Add success callback mock_success_callbacks = [] proxy_config._add_callback_from_db_to_in_memory_litellm_callbacks( callback="prometheus", event_types=["success"], existing_callbacks=mock_success_callbacks, ) mock_callback_manager.add_litellm_success_callback.assert_called_once_with("prometheus") mock_callback_manager.reset_mock() # Test Case 2: Add failure callback mock_failure_callbacks = [] proxy_config._add_callback_from_db_to_in_memory_litellm_callbacks( callback="langfuse", event_types=["failure"], existing_callbacks=mock_failure_callbacks, ) mock_callback_manager.add_litellm_failure_callback.assert_called_once_with("langfuse") mock_callback_manager.reset_mock() # Test Case 3: Add callback for both success and failure mock_callbacks = [] proxy_config._add_callback_from_db_to_in_memory_litellm_callbacks( callback="s3", event_types=["success", "failure"], existing_callbacks=mock_callbacks, ) mock_callback_manager.add_litellm_callback.assert_called_once_with("s3") mock_callback_manager.reset_mock() # Test Case 4: Don't add callback if it already exists existing_callbacks_with_item = ["prometheus"] proxy_config._add_callback_from_db_to_in_memory_litellm_callbacks( callback="prometheus", event_types=["success"], existing_callbacks=existing_callbacks_with_item, ) mock_callback_manager.add_litellm_success_callback.assert_not_called() def test_should_load_db_object_with_supported_db_objects(): """ Test _should_load_db_object method with supported_db_objects configuration. Verifies that when supported_db_objects is set, only specified object types are loaded from the database. """ from unittest.mock import patch from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() # Test Case 1: supported_db_objects not set - all objects should be loaded with patch("litellm.proxy.proxy_server.general_settings", {}): assert proxy_config._should_load_db_object(object_type="models") is True assert proxy_config._should_load_db_object(object_type="mcp") is True assert proxy_config._should_load_db_object(object_type="guardrails") is True assert proxy_config._should_load_db_object(object_type="vector_stores") is True # Test Case 2: supported_db_objects set to only load MCP with patch( "litellm.proxy.proxy_server.general_settings", {"supported_db_objects": ["mcp"]}, ): assert proxy_config._should_load_db_object(object_type="models") is False assert proxy_config._should_load_db_object(object_type="mcp") is True assert proxy_config._should_load_db_object(object_type="guardrails") is False assert proxy_config._should_load_db_object(object_type="vector_stores") is False assert proxy_config._should_load_db_object(object_type="prompts") is False # Test Case 3: supported_db_objects set to load multiple types with patch( "litellm.proxy.proxy_server.general_settings", {"supported_db_objects": ["mcp", "guardrails", "vector_stores"]}, ): assert proxy_config._should_load_db_object(object_type="models") is False assert proxy_config._should_load_db_object(object_type="mcp") is True assert proxy_config._should_load_db_object(object_type="guardrails") is True assert proxy_config._should_load_db_object(object_type="vector_stores") is True assert proxy_config._should_load_db_object(object_type="prompts") is False # Test Case 4: supported_db_objects is not a list (should default to loading all) with patch( "litellm.proxy.proxy_server.general_settings", {"supported_db_objects": "invalid_type"}, ): assert proxy_config._should_load_db_object(object_type="models") is True assert proxy_config._should_load_db_object(object_type="mcp") is True # Test Case 5: supported_db_objects is an empty list (nothing should be loaded) with patch( "litellm.proxy.proxy_server.general_settings", {"supported_db_objects": []}, ): assert proxy_config._should_load_db_object(object_type="models") is False assert proxy_config._should_load_db_object(object_type="mcp") is False assert proxy_config._should_load_db_object(object_type="guardrails") is False # Test Case 6: Test all available object types with patch( "litellm.proxy.proxy_server.general_settings", { "supported_db_objects": [ "models", "mcp", "guardrails", "vector_stores", "pass_through_endpoints", "prompts", "model_cost_map", ] }, ): assert proxy_config._should_load_db_object(object_type="models") is True assert proxy_config._should_load_db_object(object_type="mcp") is True assert proxy_config._should_load_db_object(object_type="guardrails") is True assert proxy_config._should_load_db_object(object_type="vector_stores") is True assert ( proxy_config._should_load_db_object(object_type="pass_through_endpoints") is True ) assert proxy_config._should_load_db_object(object_type="prompts") is True assert proxy_config._should_load_db_object(object_type="model_cost_map") is True @pytest.mark.asyncio async def test_tag_cache_update_called(): """ Test that update_cache updates tag cache when tags are provided. """ from litellm.caching.caching import DualCache from litellm.proxy.proxy_server import user_api_key_cache cache = DualCache() setattr( litellm.proxy.proxy_server, "user_api_key_cache", cache, ) mock_tag_obj = { "tag_name": "test-tag", "spend": 10.0, } with patch.object(cache, "async_get_cache", new=AsyncMock(return_value=mock_tag_obj)) as mock_get_cache: with patch.object(cache, "async_set_cache_pipeline", new=AsyncMock()) as mock_set_cache: await litellm.proxy.proxy_server.update_cache( token=None, user_id=None, end_user_id=None, team_id=None, response_cost=5.0, parent_otel_span=None, tags=["test-tag"], ) await asyncio.sleep(0.1) mock_get_cache.assert_awaited_once_with(key="tag:test-tag") mock_set_cache.assert_awaited_once() call_args = mock_set_cache.call_args cache_list = call_args.kwargs["cache_list"] assert len(cache_list) == 1 cache_key, cache_value = cache_list[0] assert cache_key == "tag:test-tag" assert cache_value["spend"] == 15.0 @pytest.mark.asyncio async def test_tag_cache_update_multiple_tags(): """ Test that multiple tags are updated in cache. """ from litellm.caching.caching import DualCache from litellm.proxy.proxy_server import user_api_key_cache cache = DualCache() setattr( litellm.proxy.proxy_server, "user_api_key_cache", cache, ) mock_tag1_obj = {"tag_name": "tag1", "spend": 10.0} mock_tag2_obj = {"tag_name": "tag2", "spend": 20.0} async def mock_get_cache_side_effect(key): if key == "tag:tag1": return mock_tag1_obj elif key == "tag:tag2": return mock_tag2_obj return None with patch.object(cache, "async_get_cache", new=AsyncMock(side_effect=mock_get_cache_side_effect)) as mock_get_cache: with patch.object(cache, "async_set_cache_pipeline", new=AsyncMock()) as mock_set_cache: await litellm.proxy.proxy_server.update_cache( token=None, user_id=None, end_user_id=None, team_id=None, response_cost=5.0, parent_otel_span=None, tags=["tag1", "tag2"], ) await asyncio.sleep(0.1) assert mock_get_cache.call_count == 2 mock_set_cache.assert_awaited_once() call_args = mock_set_cache.call_args cache_list = call_args.kwargs["cache_list"] assert len(cache_list) == 2 tag_updates = {cache_key: cache_value for cache_key, cache_value in cache_list} assert "tag:tag1" in tag_updates assert "tag:tag2" in tag_updates assert tag_updates["tag:tag1"]["spend"] == 15.0 assert tag_updates["tag:tag2"]["spend"] == 25.0 @pytest.mark.asyncio async def test_init_sso_settings_in_db(): """ Test that _init_sso_settings_in_db properly loads SSO settings from database, uppercases keys, and calls _decrypt_and_set_db_env_variables. """ from unittest.mock import AsyncMock, MagicMock, patch from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() # Test Case 1: SSO settings exist in database mock_sso_config = MagicMock() mock_sso_config.sso_settings = { "google_client_id": "test-client-id", "google_client_secret": "test-client-secret", "microsoft_client_id": "ms-client-id", "microsoft_client_secret": "ms-client-secret", } mock_prisma_client = MagicMock() mock_prisma_client.db.litellm_ssoconfig.find_unique = AsyncMock( return_value=mock_sso_config ) # Mock _decrypt_and_set_db_env_variables with patch.object( proxy_config, "_decrypt_and_set_db_env_variables" ) as mock_decrypt_and_set: await proxy_config._init_sso_settings_in_db(prisma_client=mock_prisma_client) # Verify find_unique was called with correct parameters mock_prisma_client.db.litellm_ssoconfig.find_unique.assert_awaited_once_with( where={"id": "sso_config"} ) # Verify _decrypt_and_set_db_env_variables was called with uppercased keys mock_decrypt_and_set.assert_called_once() call_args = mock_decrypt_and_set.call_args uppercased_settings = call_args.kwargs["environment_variables"] # Verify all keys are uppercased assert "GOOGLE_CLIENT_ID" in uppercased_settings assert "GOOGLE_CLIENT_SECRET" in uppercased_settings assert "MICROSOFT_CLIENT_ID" in uppercased_settings assert "MICROSOFT_CLIENT_SECRET" in uppercased_settings # Verify values are preserved assert uppercased_settings["GOOGLE_CLIENT_ID"] == "test-client-id" assert uppercased_settings["GOOGLE_CLIENT_SECRET"] == "test-client-secret" assert uppercased_settings["MICROSOFT_CLIENT_ID"] == "ms-client-id" assert uppercased_settings["MICROSOFT_CLIENT_SECRET"] == "ms-client-secret" # Verify original lowercase keys are not present assert "google_client_id" not in uppercased_settings assert "microsoft_client_id" not in uppercased_settings @pytest.mark.asyncio async def test_init_sso_settings_in_db_no_settings(): """ Test that _init_sso_settings_in_db handles the case when no SSO settings exist in database. """ from unittest.mock import AsyncMock, MagicMock, patch from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() # Mock prisma client to return None (no SSO settings) mock_prisma_client = MagicMock() mock_prisma_client.db.litellm_ssoconfig.find_unique = AsyncMock(return_value=None) # Mock _decrypt_and_set_db_env_variables with patch.object( proxy_config, "_decrypt_and_set_db_env_variables" ) as mock_decrypt_and_set: await proxy_config._init_sso_settings_in_db(prisma_client=mock_prisma_client) # Verify find_unique was called mock_prisma_client.db.litellm_ssoconfig.find_unique.assert_awaited_once_with( where={"id": "sso_config"} ) # Verify _decrypt_and_set_db_env_variables was NOT called when no settings exist mock_decrypt_and_set.assert_not_called() @pytest.mark.asyncio async def test_init_sso_settings_in_db_error_handling(): """ Test that _init_sso_settings_in_db handles database errors gracefully. """ from unittest.mock import AsyncMock, MagicMock, patch from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() # Mock prisma client to raise an exception mock_prisma_client = MagicMock() mock_prisma_client.db.litellm_ssoconfig.find_unique = AsyncMock( side_effect=Exception("Database connection error") ) # The method should not raise an exception, it should log it instead try: await proxy_config._init_sso_settings_in_db(prisma_client=mock_prisma_client) # If we get here, the exception was handled properly assert True except Exception as e: # The exception should be caught and logged, not propagated pytest.fail(f"Exception should have been caught and logged, but was raised: {e}") @pytest.mark.asyncio async def test_init_sso_settings_in_db_empty_settings(): """ Test that _init_sso_settings_in_db handles empty SSO settings dictionary. """ from unittest.mock import AsyncMock, MagicMock, patch from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() # Mock SSO config with empty settings dictionary mock_sso_config = MagicMock() mock_sso_config.sso_settings = {} mock_prisma_client = MagicMock() mock_prisma_client.db.litellm_ssoconfig.find_unique = AsyncMock( return_value=mock_sso_config ) # Mock _decrypt_and_set_db_env_variables with patch.object( proxy_config, "_decrypt_and_set_db_env_variables" ) as mock_decrypt_and_set: await proxy_config._init_sso_settings_in_db(prisma_client=mock_prisma_client) # Verify find_unique was called mock_prisma_client.db.litellm_ssoconfig.find_unique.assert_awaited_once_with( where={"id": "sso_config"} ) # Verify _decrypt_and_set_db_env_variables was called with empty dict mock_decrypt_and_set.assert_called_once() call_args = mock_decrypt_and_set.call_args uppercased_settings = call_args.kwargs["environment_variables"] # Verify empty dictionary assert uppercased_settings == {} def test_update_config_fields_uppercases_env_vars(monkeypatch): """ Ensure environment variables pulled from DB are uppercased when applied so integrations like Datadog that expect uppercase env keys can read them. """ from litellm.proxy.proxy_server import ProxyConfig for key in ["DD_API_KEY", "DD_SITE", "dd_api_key", "dd_site"]: monkeypatch.delenv(key, raising=False) proxy_config = ProxyConfig() updated_config = proxy_config._update_config_fields( current_config={}, param_name="environment_variables", db_param_value={"dd_api_key": "test-api-key", "dd_site": "us5.datadoghq.com"}, ) env_vars = updated_config.get("environment_variables", {}) assert env_vars["DD_API_KEY"] == "test-api-key" assert env_vars["DD_SITE"] == "us5.datadoghq.com" assert os.environ.get("DD_API_KEY") == "test-api-key" assert os.environ.get("DD_SITE") == "us5.datadoghq.com" def test_get_prompt_spec_for_db_prompt_with_versions(): """ Test that _get_prompt_spec_for_db_prompt correctly converts database prompts to PromptSpec with versioned naming convention. """ from unittest.mock import MagicMock from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() # Mock database prompt version 1 mock_prompt_v1 = MagicMock() mock_prompt_v1.model_dump.return_value = { "id": "uuid-1", "prompt_id": "chat_prompt", "version": 1, "litellm_params": '{"prompt_id": "chat_prompt", "prompt_integration": "dotprompt", "model": "gpt-3.5-turbo", "messages": [{"role": "user", "content": "v1 content"}]}', "prompt_info": '{"prompt_type": "db"}', "created_at": "2024-01-01T00:00:00", "updated_at": "2024-01-01T00:00:00", } # Mock database prompt version 2 mock_prompt_v2 = MagicMock() mock_prompt_v2.model_dump.return_value = { "id": "uuid-2", "prompt_id": "chat_prompt", "version": 2, "litellm_params": '{"prompt_id": "chat_prompt", "prompt_integration": "dotprompt", "model": "gpt-4", "messages": [{"role": "user", "content": "v2 content"}]}', "prompt_info": '{"prompt_type": "db"}', "created_at": "2024-01-02T00:00:00", "updated_at": "2024-01-02T00:00:00", } # Test version 1 prompt_spec_v1 = proxy_config._get_prompt_spec_for_db_prompt(db_prompt=mock_prompt_v1) assert prompt_spec_v1.prompt_id == "chat_prompt.v1" # Test version 2 prompt_spec_v2 = proxy_config._get_prompt_spec_for_db_prompt(db_prompt=mock_prompt_v2) assert prompt_spec_v2.prompt_id == "chat_prompt.v2" def test_root_redirect_when_docs_url_not_root_and_redirect_url_set(monkeypatch): from fastapi.responses import RedirectResponse from litellm.proxy.proxy_server import cleanup_router_config_variables from litellm.proxy.utils import _get_docs_url cleanup_router_config_variables() filepath = os.path.dirname(os.path.abspath(__file__)) config_fp = f"{filepath}/test_configs/test_config_no_auth.yaml" # Ensure docs are mounted on a non-root path to trigger redirect logic monkeypatch.setenv("DOCS_URL", "/docs") test_redirect_url = "/ui" monkeypatch.setenv("ROOT_REDIRECT_URL", test_redirect_url) asyncio.run(initialize(config=config_fp, debug=True)) docs_url = _get_docs_url() root_redirect_url = os.getenv("ROOT_REDIRECT_URL") # Remove any existing "/" route that might interfere routes_to_remove = [] for route in app.routes: if hasattr(route, "path") and route.path == "/": if hasattr(route, "methods") and "GET" in route.methods: routes_to_remove.append(route) elif not hasattr(route, "methods"): # Catch-all routes routes_to_remove.append(route) for route in routes_to_remove: app.routes.remove(route) # Add the redirect route if conditions are met (matching the actual implementation) if docs_url != "/" and root_redirect_url: @app.get("/", include_in_schema=False) async def root_redirect(): return RedirectResponse(url=root_redirect_url) client = TestClient(app) response = client.get("/", follow_redirects=False) assert response.status_code == 307 assert response.headers["location"] == test_redirect_url @pytest.mark.asyncio async def test_get_image_non_root_uses_var_lib_assets_dir(monkeypatch): """ Test that get_image uses /var/lib/litellm/assets when LITELLM_NON_ROOT is true. """ from unittest.mock import patch from litellm.proxy.proxy_server import get_image # Set LITELLM_NON_ROOT to true monkeypatch.setenv("LITELLM_NON_ROOT", "true") monkeypatch.delenv("UI_LOGO_PATH", raising=False) # Mock os.path operations - exists=False for assets_dir so makedirs gets called def exists_side_effect(path): return False if path == "/var/lib/litellm/assets" else True with patch("litellm.proxy.proxy_server.os.makedirs") as mock_makedirs, \ patch("litellm.proxy.proxy_server.os.path.exists", side_effect=exists_side_effect), \ patch("litellm.proxy.proxy_server.os.access", return_value=True), \ patch("litellm.proxy.proxy_server.os.getenv") as mock_getenv, \ patch("litellm.proxy.proxy_server.FileResponse") as mock_file_response: # Setup mock_getenv to return empty string for UI_LOGO_PATH def getenv_side_effect(key, default=""): if key == "UI_LOGO_PATH": return "" elif key == "LITELLM_NON_ROOT": return "true" return default mock_getenv.side_effect = getenv_side_effect # Call the function await get_image() # Verify makedirs was called with /var/lib/litellm/assets mock_makedirs.assert_called_once_with("/var/lib/litellm/assets", exist_ok=True) @pytest.mark.asyncio async def test_get_image_non_root_fallback_to_default_logo(monkeypatch): """ Test that get_image falls back to default_site_logo when logo doesn't exist in /var/lib/litellm/assets for non-root case. """ from unittest.mock import patch from litellm.proxy.proxy_server import get_image # Set LITELLM_NON_ROOT to true monkeypatch.setenv("LITELLM_NON_ROOT", "true") monkeypatch.delenv("UI_LOGO_PATH", raising=False) # Track path.exists calls to verify it checks /var/lib/litellm/assets/logo.jpg exists_calls = [] def exists_side_effect(path): exists_calls.append(path) # Return False for /var/lib/litellm/assets* so: makedirs is called, logo fallback # triggers, and we don't return early with cached file if "/var/lib/litellm/assets" in path: return False return True # Mock os.path operations with patch("litellm.proxy.proxy_server.os.makedirs") as mock_makedirs, \ patch("litellm.proxy.proxy_server.os.path.exists", side_effect=exists_side_effect), \ patch("litellm.proxy.proxy_server.os.access", return_value=True), \ patch("litellm.proxy.proxy_server.os.getenv") as mock_getenv, \ patch("litellm.proxy.proxy_server.FileResponse") as mock_file_response: # Setup mock_getenv def getenv_side_effect(key, default=""): if key == "UI_LOGO_PATH": return "" elif key == "LITELLM_NON_ROOT": return "true" return default mock_getenv.side_effect = getenv_side_effect # Call the function await get_image() # Verify makedirs was called with /var/lib/litellm/assets mock_makedirs.assert_called_once_with("/var/lib/litellm/assets", exist_ok=True) # Verify that exists was called to check /var/lib/litellm/assets/logo.jpg assets_logo_path = "/var/lib/litellm/assets/logo.jpg" assert any(assets_logo_path in str(call) for call in exists_calls), \ f"Should check if {assets_logo_path} exists" # Verify FileResponse was called (with fallback logo) assert mock_file_response.called, "FileResponse should be called" @pytest.mark.asyncio async def test_get_image_root_case_uses_current_dir(monkeypatch): """ Test that get_image uses current_dir when LITELLM_NON_ROOT is not true. """ from unittest.mock import patch from litellm.proxy.proxy_server import get_image # Don't set LITELLM_NON_ROOT (or set it to false) monkeypatch.delenv("LITELLM_NON_ROOT", raising=False) monkeypatch.delenv("UI_LOGO_PATH", raising=False) # Mock os.path operations with patch("litellm.proxy.proxy_server.os.makedirs") as mock_makedirs, \ patch("litellm.proxy.proxy_server.os.path.exists", return_value=True), \ patch("litellm.proxy.proxy_server.os.getenv") as mock_getenv, \ patch("litellm.proxy.proxy_server.FileResponse") as mock_file_response: # Setup mock_getenv def getenv_side_effect(key, default=""): if key == "UI_LOGO_PATH": return "" elif key == "LITELLM_NON_ROOT": return "" # Not set or empty return default mock_getenv.side_effect = getenv_side_effect # Call the function await get_image() # Verify makedirs was NOT called with /var/lib/litellm/assets (should not create it for root case) var_lib_assets_calls = [ call for call in mock_makedirs.call_args_list if "/var/lib/litellm/assets" in str(call) ] assert len(var_lib_assets_calls) == 0, "Should not create /var/lib/litellm/assets for root case" # Verify FileResponse was called assert mock_file_response.called, "FileResponse should be called" @pytest.mark.asyncio async def test_get_image_custom_local_logo_bypasses_cache(monkeypatch): """ Test that when UI_LOGO_PATH is set to a local file, get_image serves it directly and does not return a stale cached_logo.jpg. Regression test: previously the cache check ran before reading UI_LOGO_PATH, so a pre-existing cached_logo.jpg (e.g. from the base Docker image) would always be returned, ignoring the user's custom logo. """ from unittest.mock import patch from litellm.proxy.proxy_server import get_image monkeypatch.setenv("UI_LOGO_PATH", "/app/custom_logo.jpg") monkeypatch.delenv("LITELLM_NON_ROOT", raising=False) monkeypatch.delenv("LITELLM_ASSETS_PATH", raising=False) calls_to_file_response = [] def fake_file_response(path, **kwargs): calls_to_file_response.append(path) return MagicMock() with patch("litellm.proxy.proxy_server.os.path.exists", return_value=True), \ patch("litellm.proxy.proxy_server.os.access", return_value=True), \ patch("litellm.proxy.proxy_server.FileResponse", side_effect=fake_file_response): await get_image() assert len(calls_to_file_response) == 1, "FileResponse should be called exactly once" assert calls_to_file_response[0] == "/app/custom_logo.jpg", ( f"Expected custom logo path, got {calls_to_file_response[0]}. " "A stale cached_logo.jpg may have been returned instead." ) @pytest.mark.asyncio async def test_get_image_default_logo_still_uses_cache(monkeypatch): """ Test that when UI_LOGO_PATH is NOT set (default logo), the cache optimization still works — cached_logo.jpg is returned if it exists. """ from unittest.mock import patch from litellm.proxy.proxy_server import get_image monkeypatch.delenv("UI_LOGO_PATH", raising=False) monkeypatch.delenv("LITELLM_NON_ROOT", raising=False) monkeypatch.delenv("LITELLM_ASSETS_PATH", raising=False) calls_to_file_response = [] def fake_file_response(path, **kwargs): calls_to_file_response.append(path) return MagicMock() with patch("litellm.proxy.proxy_server.os.path.exists", return_value=True), \ patch("litellm.proxy.proxy_server.os.access", return_value=True), \ patch("litellm.proxy.proxy_server.FileResponse", side_effect=fake_file_response): await get_image() assert len(calls_to_file_response) == 1, "FileResponse should be called exactly once" served_path = calls_to_file_response[0] assert served_path.endswith("cached_logo.jpg"), ( f"Expected cached_logo.jpg for default logo, got {served_path}" ) @pytest.mark.asyncio async def test_get_image_custom_logo_missing_falls_through_to_default(monkeypatch): """ Test that when UI_LOGO_PATH points to a non-existent local file, get_image falls through to the cache/default logo instead of failing. """ from unittest.mock import patch from litellm.proxy.proxy_server import get_image monkeypatch.setenv("UI_LOGO_PATH", "/app/nonexistent_logo.jpg") monkeypatch.delenv("LITELLM_NON_ROOT", raising=False) monkeypatch.delenv("LITELLM_ASSETS_PATH", raising=False) calls_to_file_response = [] def fake_file_response(path, **kwargs): calls_to_file_response.append(path) return MagicMock() def exists_side_effect(path): # The custom logo does NOT exist; cache and default DO exist if path == "/app/nonexistent_logo.jpg": return False return True with patch("litellm.proxy.proxy_server.os.path.exists", side_effect=exists_side_effect), \ patch("litellm.proxy.proxy_server.os.access", return_value=True), \ patch("litellm.proxy.proxy_server.FileResponse", side_effect=fake_file_response): await get_image() assert len(calls_to_file_response) == 1, "FileResponse should be called exactly once" served_path = calls_to_file_response[0] assert served_path != "/app/nonexistent_logo.jpg", ( "Should not attempt to serve a non-existent custom logo" ) assert served_path.endswith("cached_logo.jpg"), ( f"Expected fallback to cached_logo.jpg, got {served_path}" ) @pytest.mark.asyncio async def test_get_image_custom_logo_missing_no_cache_serves_default(monkeypatch): """ Test that when UI_LOGO_PATH points to a non-existent file AND there is no cached_logo.jpg, get_image serves the default logo instead of the non-existent custom path. """ from unittest.mock import patch from litellm.proxy.proxy_server import get_image monkeypatch.setenv("UI_LOGO_PATH", "/app/nonexistent_logo.jpg") monkeypatch.delenv("LITELLM_NON_ROOT", raising=False) monkeypatch.delenv("LITELLM_ASSETS_PATH", raising=False) calls_to_file_response = [] def fake_file_response(path, **kwargs): calls_to_file_response.append(path) return MagicMock() def exists_side_effect(path): # Neither the custom logo nor the cache exist if path == "/app/nonexistent_logo.jpg": return False if "cached_logo.jpg" in path: return False return True with patch("litellm.proxy.proxy_server.os.path.exists", side_effect=exists_side_effect), \ patch("litellm.proxy.proxy_server.os.access", return_value=True), \ patch("litellm.proxy.proxy_server.FileResponse", side_effect=fake_file_response): await get_image() assert len(calls_to_file_response) == 1, "FileResponse should be called exactly once" served_path = calls_to_file_response[0] assert served_path != "/app/nonexistent_logo.jpg", ( "Should not attempt to serve a non-existent custom logo" ) assert served_path.endswith("logo.jpg"), ( f"Expected fallback to default logo.jpg, got {served_path}" ) def test_get_config_normalizes_string_callbacks(monkeypatch): """ Test that /get/config/callbacks normalizes string callbacks to lists. """ from litellm.proxy.proxy_server import app, proxy_config, user_api_key_auth config_data = { "litellm_settings": { "success_callback": "langfuse", "failure_callback": None, "callbacks": ["prometheus", "datadog"], }, "general_settings": {}, "environment_variables": {}, } mock_router = MagicMock() mock_router.get_settings.return_value = {} monkeypatch.setattr("litellm.proxy.proxy_server.llm_router", mock_router) monkeypatch.setattr( proxy_config, "get_config", AsyncMock(return_value=config_data) ) original_overrides = app.dependency_overrides.copy() app.dependency_overrides[user_api_key_auth] = lambda: MagicMock() client = TestClient(app) try: response = client.get("/get/config/callbacks") finally: app.dependency_overrides = original_overrides assert response.status_code == 200 callbacks = response.json()["callbacks"] success_callbacks = [cb["name"] for cb in callbacks if cb.get("type") == "success"] failure_callbacks = [cb["name"] for cb in callbacks if cb.get("type") == "failure"] success_and_failure_callbacks = [ cb["name"] for cb in callbacks if cb.get("type") == "success_and_failure" ] assert "langfuse" in success_callbacks assert len(failure_callbacks) == 0 assert "prometheus" in success_and_failure_callbacks assert "datadog" in success_and_failure_callbacks def test_deep_merge_dicts_skips_none_and_empty_lists(monkeypatch): """ Test that _update_config_fields deep merge skips None values and empty lists. """ from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() current_config = { "general_settings": { "max_parallel_requests": 10, "allowed_models": ["gpt-3.5-turbo", "gpt-4"], "nested": { "key1": "value1", "key2": "value2", }, } } db_param_value = { "max_parallel_requests": None, "allowed_models": [], "new_key": "new_value", "nested": { "key1": "updated_value1", "key3": "value3", }, } result = proxy_config._update_config_fields( current_config, "general_settings", db_param_value ) assert result["general_settings"]["max_parallel_requests"] == 10 assert result["general_settings"]["allowed_models"] == ["gpt-3.5-turbo", "gpt-4"] assert result["general_settings"]["new_key"] == "new_value" assert result["general_settings"]["nested"]["key1"] == "updated_value1" assert result["general_settings"]["nested"]["key2"] == "value2" assert result["general_settings"]["nested"]["key3"] == "value3" class TestInvitationEndpoints: """Tests for /invitation/new and /invitation/delete endpoints.""" @pytest.fixture def client_with_auth(self): """Create a test client with admin authentication.""" from litellm.proxy._types import LitellmUserRoles from litellm.proxy.proxy_server import cleanup_router_config_variables cleanup_router_config_variables() filepath = os.path.dirname(os.path.abspath(__file__)) config_fp = f"{filepath}/test_configs/test_config_no_auth.yaml" asyncio.run(initialize(config=config_fp, debug=True)) mock_auth = MagicMock() mock_auth.user_id = "admin-user-id" mock_auth.user_role = LitellmUserRoles.PROXY_ADMIN mock_auth.api_key = "sk-test" app.dependency_overrides[user_api_key_auth] = lambda: mock_auth return TestClient(app) @pytest.mark.parametrize( "endpoint,payload,mock_return", [ ( "/invitation/new", {"user_id": "target-user-123"}, { "id": "inv-123", "user_id": "target-user-123", "is_accepted": False, "accepted_at": None, "expires_at": "2025-02-18T00:00:00", "created_at": "2025-02-11T00:00:00", "created_by": "admin-user-id", "updated_at": "2025-02-11T00:00:00", "updated_by": "admin-user-id", }, ), ( "/invitation/delete", {"invitation_id": "inv-456"}, { "id": "inv-456", "user_id": "target-user-123", "is_accepted": False, "accepted_at": None, "expires_at": "2025-02-18T00:00:00", "created_at": "2025-02-11T00:00:00", "created_by": "admin-user-id", "updated_at": "2025-02-11T00:00:00", "updated_by": "admin-user-id", }, ), ], ) def test_invitation_endpoints_proxy_admin_success( self, client_with_auth, endpoint, payload, mock_return ): """Proxy admin can successfully create and delete invitations.""" with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma: mock_prisma.db.litellm_invitationlink = MagicMock() if endpoint == "/invitation/new": mock_create = AsyncMock(return_value=mock_return) with patch( "litellm.proxy.management_helpers.user_invitation.create_invitation_for_user", mock_create, ): response = client_with_auth.post(endpoint, json=payload) else: mock_prisma.db.litellm_invitationlink.find_unique = AsyncMock( return_value={**mock_return, "created_by": "admin-user-id"} ) mock_prisma.db.litellm_invitationlink.delete = AsyncMock( return_value=mock_return ) response = client_with_auth.post(endpoint, json=payload) assert response.status_code == 200 data = response.json() assert data["id"] == mock_return["id"] assert data["user_id"] == mock_return["user_id"] @pytest.mark.parametrize( "endpoint,payload", [ ("/invitation/new", {"user_id": "target-user-123"}), ("/invitation/delete", {"invitation_id": "inv-456"}), ], ) def test_invitation_endpoints_non_admin_denied( self, client_with_auth, endpoint, payload ): """Non-admin users cannot access invitation endpoints.""" from litellm.proxy._types import LitellmUserRoles mock_auth = MagicMock() mock_auth.user_id = "regular-user" mock_auth.user_role = LitellmUserRoles.INTERNAL_USER mock_auth.api_key = "sk-regular" app.dependency_overrides[user_api_key_auth] = lambda: mock_auth with patch("litellm.proxy.proxy_server.prisma_client") as mock_prisma: mock_prisma.db.litellm_invitationlink = MagicMock() # Avoid triggering async DB calls in _user_has_admin_privileges with patch( "litellm.proxy.proxy_server._user_has_admin_privileges", new_callable=AsyncMock, return_value=False, ): response = client_with_auth.post(endpoint, json=payload) assert response.status_code == 400 body = response.json() # ProxyException handler returns {"error": {...}}, HTTPException returns {"detail": {...}} error_content = body.get("error", body.get("detail", body)) assert "not allowed" in str(error_content).lower() @pytest.mark.asyncio async def test_async_data_generator_cleanup_on_early_exit(): """ Test that async_data_generator calls response.aclose() in the finally block when the generator is abandoned mid-stream (client disconnect). """ from litellm.proxy._types import UserAPIKeyAuth from litellm.proxy.proxy_server import async_data_generator from litellm.proxy.utils import ProxyLogging mock_user_api_key_dict = MagicMock(spec=UserAPIKeyAuth) mock_request_data = { "model": "gpt-3.5-turbo", "messages": [{"role": "user", "content": "test"}], } mock_chunks = [ {"choices": [{"delta": {"content": "Hello"}}]}, {"choices": [{"delta": {"content": " world"}}]}, {"choices": [{"delta": {"content": " more"}}]}, ] mock_proxy_logging_obj = MagicMock(spec=ProxyLogging) async def mock_streaming_iterator(*args, **kwargs): for chunk in mock_chunks: yield chunk mock_proxy_logging_obj.async_post_call_streaming_iterator_hook = ( mock_streaming_iterator ) mock_proxy_logging_obj.async_post_call_streaming_hook = AsyncMock( side_effect=lambda **kwargs: kwargs.get("response") ) mock_proxy_logging_obj.post_call_failure_hook = AsyncMock() # Create a mock response with aclose mock_response = MagicMock() mock_response.aclose = AsyncMock() with patch("litellm.proxy.proxy_server.proxy_logging_obj", mock_proxy_logging_obj): # Consume only the first chunk then abandon the generator (simulates client disconnect) gen = async_data_generator( mock_response, mock_user_api_key_dict, mock_request_data ) first_chunk = await gen.__anext__() assert first_chunk.startswith("data: ") # Close the generator early (simulates what ASGI does on client disconnect) await gen.aclose() # Verify aclose was called on the response to release the HTTP connection mock_response.aclose.assert_awaited_once() @pytest.mark.asyncio async def test_async_data_generator_cleanup_on_normal_completion(): """ Test that async_data_generator calls response.aclose() even on normal completion. """ from litellm.proxy._types import UserAPIKeyAuth from litellm.proxy.proxy_server import async_data_generator from litellm.proxy.utils import ProxyLogging mock_user_api_key_dict = MagicMock(spec=UserAPIKeyAuth) mock_request_data = { "model": "gpt-3.5-turbo", "messages": [{"role": "user", "content": "test"}], } mock_chunks = [ {"choices": [{"delta": {"content": "Hello"}}]}, ] mock_proxy_logging_obj = MagicMock(spec=ProxyLogging) async def mock_streaming_iterator(*args, **kwargs): for chunk in mock_chunks: yield chunk mock_proxy_logging_obj.async_post_call_streaming_iterator_hook = ( mock_streaming_iterator ) mock_proxy_logging_obj.async_post_call_streaming_hook = AsyncMock( side_effect=lambda **kwargs: kwargs.get("response") ) mock_proxy_logging_obj.post_call_failure_hook = AsyncMock() mock_response = MagicMock() mock_response.aclose = AsyncMock() with patch("litellm.proxy.proxy_server.proxy_logging_obj", mock_proxy_logging_obj): yielded_data = [] async for data in async_data_generator( mock_response, mock_user_api_key_dict, mock_request_data ): yielded_data.append(data) # Should have completed normally with [DONE] assert any("[DONE]" in d for d in yielded_data) # aclose should still be called via finally block mock_response.aclose.assert_awaited_once() @pytest.mark.asyncio async def test_async_data_generator_cleanup_on_midstream_error(): """ Test that async_data_generator calls response.aclose() via finally block even when an exception occurs mid-stream. """ from litellm.proxy._types import UserAPIKeyAuth from litellm.proxy.proxy_server import async_data_generator from litellm.proxy.utils import ProxyLogging mock_user_api_key_dict = MagicMock(spec=UserAPIKeyAuth) mock_request_data = { "model": "gpt-3.5-turbo", "messages": [{"role": "user", "content": "test"}], } mock_proxy_logging_obj = MagicMock(spec=ProxyLogging) async def mock_streaming_iterator_with_error(*args, **kwargs): yield {"choices": [{"delta": {"content": "Hello"}}]} raise RuntimeError("upstream connection reset") mock_proxy_logging_obj.async_post_call_streaming_iterator_hook = ( mock_streaming_iterator_with_error ) mock_proxy_logging_obj.async_post_call_streaming_hook = AsyncMock( side_effect=lambda **kwargs: kwargs.get("response") ) mock_proxy_logging_obj.post_call_failure_hook = AsyncMock() mock_response = MagicMock() mock_response.aclose = AsyncMock() with patch("litellm.proxy.proxy_server.proxy_logging_obj", mock_proxy_logging_obj): yielded_data = [] async for data in async_data_generator( mock_response, mock_user_api_key_dict, mock_request_data ): yielded_data.append(data) # Should have yielded data chunk and then an error chunk assert len(yielded_data) >= 2 assert any("error" in d for d in yielded_data) # aclose must still be called via finally block despite the error mock_response.aclose.assert_awaited_once() # ============================================================================ # store_model_in_db DB Config Override Tests # ============================================================================ def test_store_model_in_db_in_config_general_settings(): """ Verify store_model_in_db is a valid field in ConfigGeneralSettings and validates correctly for True/False values. """ from litellm.proxy._types import ConfigGeneralSettings assert "store_model_in_db" in ConfigGeneralSettings.model_fields # Should validate with True config = ConfigGeneralSettings(store_model_in_db=True) assert config.store_model_in_db is True # Should validate with False config = ConfigGeneralSettings(store_model_in_db=False) assert config.store_model_in_db is False # Should validate with None (default) config = ConfigGeneralSettings(store_model_in_db=None) assert config.store_model_in_db is None # Should validate with no value config = ConfigGeneralSettings() assert config.store_model_in_db is None @pytest.mark.asyncio async def test_update_general_settings_store_model_in_db_true(): """ Verify _update_general_settings sets global store_model_in_db to True when DB general_settings has store_model_in_db=True. """ from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() with patch( "litellm.proxy.proxy_server.store_model_in_db", False ) as mock_store, patch( "litellm.proxy.proxy_server.general_settings", {} ) as mock_gs: await proxy_config._update_general_settings( db_general_settings={"store_model_in_db": True} ) import litellm.proxy.proxy_server as ps assert ps.store_model_in_db is True assert ps.general_settings["store_model_in_db"] is True @pytest.mark.asyncio async def test_update_general_settings_store_model_in_db_false(): """ Verify _update_general_settings sets global store_model_in_db to False when DB general_settings has store_model_in_db=False. """ from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() with patch( "litellm.proxy.proxy_server.store_model_in_db", True ), patch("litellm.proxy.proxy_server.general_settings", {}): await proxy_config._update_general_settings( db_general_settings={"store_model_in_db": False} ) import litellm.proxy.proxy_server as ps assert ps.store_model_in_db is False assert ps.general_settings["store_model_in_db"] is False @pytest.mark.asyncio async def test_update_general_settings_store_model_in_db_string_normalization(): """ Verify _update_general_settings normalizes string values for store_model_in_db. """ from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() # Test "true" string with patch( "litellm.proxy.proxy_server.store_model_in_db", False ), patch("litellm.proxy.proxy_server.general_settings", {}): await proxy_config._update_general_settings( db_general_settings={"store_model_in_db": "true"} ) import litellm.proxy.proxy_server as ps assert ps.store_model_in_db is True # Test "True" string with patch( "litellm.proxy.proxy_server.store_model_in_db", False ), patch("litellm.proxy.proxy_server.general_settings", {}): await proxy_config._update_general_settings( db_general_settings={"store_model_in_db": "True"} ) import litellm.proxy.proxy_server as ps assert ps.store_model_in_db is True # Test "false" string with patch( "litellm.proxy.proxy_server.store_model_in_db", True ), patch("litellm.proxy.proxy_server.general_settings", {}): await proxy_config._update_general_settings( db_general_settings={"store_model_in_db": "false"} ) import litellm.proxy.proxy_server as ps assert ps.store_model_in_db is False @pytest.mark.asyncio async def test_update_general_settings_store_model_in_db_none_keeps_current(): """ Verify _update_general_settings does not change store_model_in_db when DB value is None. """ from litellm.proxy.proxy_server import ProxyConfig proxy_config = ProxyConfig() # When current is True and DB sends None, should stay True with patch( "litellm.proxy.proxy_server.store_model_in_db", True ), patch("litellm.proxy.proxy_server.general_settings", {}): await proxy_config._update_general_settings( db_general_settings={"store_model_in_db": None} ) import litellm.proxy.proxy_server as ps assert ps.store_model_in_db is True # When current is False and DB sends None, should stay False with patch( "litellm.proxy.proxy_server.store_model_in_db", False ), patch("litellm.proxy.proxy_server.general_settings", {}): await proxy_config._update_general_settings( db_general_settings={"store_model_in_db": None} ) import litellm.proxy.proxy_server as ps assert ps.store_model_in_db is False @pytest.mark.asyncio async def test_store_model_in_db_db_override_when_config_false(): """ Verify the early DB check in initialize_scheduled_background_jobs overrides store_model_in_db=False when DB has True. """ from litellm.proxy.proxy_server import ProxyStartupEvent from litellm.proxy.utils import ProxyLogging mock_prisma_client = MagicMock() # Mock DB returning store_model_in_db=True in general_settings mock_db_record = MagicMock() mock_db_record.param_value = {"store_model_in_db": True} mock_prisma_client.db.litellm_config.find_first = AsyncMock( return_value=mock_db_record ) mock_proxy_logging = MagicMock(spec=ProxyLogging) mock_proxy_logging.slack_alerting_instance = MagicMock() mock_proxy_config = AsyncMock() with patch( "litellm.proxy.proxy_server.proxy_config", mock_proxy_config ), patch( "litellm.proxy.proxy_server.store_model_in_db", False ), patch( "litellm.proxy.proxy_server.get_secret_bool", return_value=False ): await ProxyStartupEvent.initialize_scheduled_background_jobs( general_settings={}, prisma_client=mock_prisma_client, proxy_budget_rescheduler_min_time=1, proxy_budget_rescheduler_max_time=2, proxy_batch_write_at=5, proxy_logging_obj=mock_proxy_logging, ) import litellm.proxy.proxy_server as ps # store_model_in_db should now be True (overridden by DB) assert ps.store_model_in_db is True # add_deployment and get_credentials should have been called # since store_model_in_db is now True assert mock_proxy_config.add_deployment.call_count == 1 assert mock_proxy_config.get_credentials.call_count == 1 @pytest.mark.asyncio async def test_store_model_in_db_db_check_skipped_when_already_true(monkeypatch): """ Verify the early DB check is skipped when store_model_in_db is already True. The DB query for the early check should not be called. """ monkeypatch.delenv("STORE_MODEL_IN_DB", raising=False) from litellm.proxy.proxy_server import ProxyStartupEvent from litellm.proxy.utils import ProxyLogging mock_prisma_client = MagicMock() mock_prisma_client.db.litellm_config.find_first = AsyncMock(return_value=None) mock_proxy_logging = MagicMock(spec=ProxyLogging) mock_proxy_logging.slack_alerting_instance = MagicMock() mock_proxy_config = AsyncMock() with patch( "litellm.proxy.proxy_server.proxy_config", mock_proxy_config ), patch( "litellm.proxy.proxy_server.store_model_in_db", True ), patch( "litellm.proxy.proxy_server.get_secret_bool", return_value=True ): await ProxyStartupEvent.initialize_scheduled_background_jobs( general_settings={}, prisma_client=mock_prisma_client, proxy_budget_rescheduler_min_time=1, proxy_budget_rescheduler_max_time=2, proxy_batch_write_at=5, proxy_logging_obj=mock_proxy_logging, ) # The early DB check uses find_first with param_name="general_settings". # When store_model_in_db is already True, the early check should be skipped. # However, add_deployment may also call find_first. # We just verify that store_model_in_db stays True and jobs are scheduled. import litellm.proxy.proxy_server as ps assert ps.store_model_in_db is True assert mock_proxy_config.add_deployment.call_count == 1 @pytest.mark.asyncio async def test_store_model_in_db_db_failure_graceful(monkeypatch): """ Verify the early DB check handles DB failures gracefully without crashing and keeps store_model_in_db as False. """ monkeypatch.delenv("STORE_MODEL_IN_DB", raising=False) from litellm.proxy.proxy_server import ProxyStartupEvent from litellm.proxy.utils import ProxyLogging mock_prisma_client = MagicMock() # Simulate DB failure mock_prisma_client.db.litellm_config.find_first = AsyncMock( side_effect=Exception("DB connection error") ) mock_proxy_logging = MagicMock(spec=ProxyLogging) mock_proxy_logging.slack_alerting_instance = MagicMock() mock_proxy_config = AsyncMock() with patch( "litellm.proxy.proxy_server.proxy_config", mock_proxy_config ), patch( "litellm.proxy.proxy_server.store_model_in_db", False ), patch( "litellm.proxy.proxy_server.get_secret_bool", return_value=False ): # Should not raise an exception await ProxyStartupEvent.initialize_scheduled_background_jobs( general_settings={}, prisma_client=mock_prisma_client, proxy_budget_rescheduler_min_time=1, proxy_budget_rescheduler_max_time=2, proxy_batch_write_at=5, proxy_logging_obj=mock_proxy_logging, ) import litellm.proxy.proxy_server as ps # store_model_in_db should remain False assert ps.store_model_in_db is False # add_deployment should NOT have been called since store_model_in_db is False mock_proxy_config.add_deployment.assert_not_called()