Files
litellm/tests/test_litellm/llms/test_volcengine.py
T
Krish Dholakia 24c2cd1bd9 Anthropic /v1/messages - Custom LLM Server support (#12016)
* fix(handler.py): support routing custom llm's to chat completion handler

Adds custom llm support for anthropic

* test(test_anthropic_experimental_pass_through_messages_handler.py): add unit test confirming custom llm respected

* docs(custom_llm_server.md): document anthropic custom llm translation

* test(volcengine.py): map thinking in extra body

Fixes https://github.com/BerriAI/litellm/issues/11879

* feat(main.py): support `azure/responses/<deployment-name>` model string

this allows us to route the model correctly

Closes https://github.com/BerriAI/litellm/issues/11879

* docs(azure_responses.md): document calling azure responses api models via chat completions bridge

Closes https://github.com/BerriAI/litellm/issues/11917

* fix: fix custom provider check

* test: update tests
2025-06-24 22:00:44 -07:00

84 lines
2.5 KiB
Python

import os
import sys
from unittest.mock import MagicMock, patch
from pydantic import BaseModel
from litellm.llms.volcengine import VolcEngineConfig
from litellm.utils import get_optional_params
class TestVolcEngineConfig:
def test_get_optional_params(self):
config = VolcEngineConfig()
supported_params = config.get_supported_openai_params(model="doubao-seed-1.6")
assert "thinking" in supported_params
mapped_params = config.map_openai_params(
non_default_params={
"thinking": {"type": "disabled"},
},
optional_params={},
model="doubao-seed-1.6",
drop_params=False,
)
assert mapped_params == {
"extra_body": {
"thinking": {"type": "disabled"},
}
}
e2e_mapped_params = get_optional_params(
model="doubao-seed-1.6",
custom_llm_provider="volcengine",
thinking={"type": "enabled"},
drop_params=False,
)
assert "thinking" in e2e_mapped_params["extra_body"] and e2e_mapped_params[
"extra_body"
]["thinking"] == {
"type": "enabled",
}
def test_e2e_completion(self):
from openai import OpenAI
from litellm import completion
from litellm.types.utils import ModelResponse
client = OpenAI(api_key="test_api_key")
mock_raw_response = MagicMock()
mock_raw_response.headers = {
"x-request-id": "123",
"openai-organization": "org-123",
"x-ratelimit-limit-requests": "100",
"x-ratelimit-remaining-requests": "99",
}
mock_raw_response.parse.return_value = ModelResponse()
with patch.object(
client.chat.completions.with_raw_response, "create", mock_raw_response
) as mock_create:
completion(
model="volcengine/doubao-seed-1.6",
messages=[
{
"role": "system",
"content": "**Tell me your model detail information.**",
}
],
user="guest",
stream=True,
thinking={"type": "disabled"},
client=client,
)
mock_create.assert_called_once()
print(mock_create.call_args.kwargs)
assert mock_create.call_args.kwargs["extra_body"] == {
"thinking": {"type": "disabled"},
}