mirror of
https://github.com/tiennm99/litellm.git
synced 2026-06-17 22:48:35 +00:00
bc26845ec4
* [Feat] Add native litellm.ocr() functions (#15567) * fix get_supported_ocr_params * add get_provider_ocr_config * init OCR * init ocr functions * add OCRResponse Base Model * add ocr to llm http handlers * add main.py for OCR * fix linting for OCR * TestMistralOCR * update to use DocumentType for Mistral * fix _prepare_ocr_request * fix transform * add main.py for OCR * add spec to init * fix OCR * TestMistralOCR * ruff fix * Potential fix for code scanning alert no. 3521: Clear-text logging of sensitive information Co-authored-by: Copilot Autofix powered by AI <62310815+github-advanced-security[bot]@users.noreply.github.com> --------- Co-authored-by: Copilot Autofix powered by AI <62310815+github-advanced-security[bot]@users.noreply.github.com> * [Feat] Add /ocr route on LiteLLM AI Gateway - Adds support for native mistral ocr calling (#15571) * fix get_supported_ocr_params * add get_provider_ocr_config * init OCR * init ocr functions * add OCRResponse Base Model * add ocr to llm http handlers * add main.py for OCR * fix linting for OCR * TestMistralOCR * update to use DocumentType for Mistral * fix _prepare_ocr_request * fix transform * add main.py for OCR * add spec to init * fix OCR * TestMistralOCR * ruff fix * add router.ocr() methods * add OCR routes * feat add ocr routes * add OCR routes * feat: add OCR routes in proxy server * working /ocr routes * test_router_aocr_with_mistral * docs Mistral OCR * docs OCR * [Feat] Add Azure AI Mistral OCR Integration (#15572) * fix get_supported_ocr_params * add get_provider_ocr_config * init OCR * init ocr functions * add OCRResponse Base Model * add ocr to llm http handlers * add main.py for OCR * fix linting for OCR * TestMistralOCR * update to use DocumentType for Mistral * fix _prepare_ocr_request * fix transform * add main.py for OCR * add spec to init * fix OCR * TestMistralOCR * ruff fix * add router.ocr() methods * add OCR routes * feat add ocr routes * add OCR routes * feat: add OCR routes in proxy server * working /ocr routes * test_router_aocr_with_mistral * docs Mistral OCR * docs OCR * add azure ai to get_provider_ocr_config * add AzureAIOCRConfig * TestAzureAIOCR * TestAzureAIOCR * test fixes for azure ai ocr * fix async OCR transform for Azure * fix transform_ocr_request --------- Co-authored-by: Copilot Autofix powered by AI <62310815+github-advanced-security[bot]@users.noreply.github.com>
89 lines
3.0 KiB
Python
89 lines
3.0 KiB
Python
"""
|
|
Test OCR functionality with Mistral API.
|
|
"""
|
|
import os
|
|
import sys
|
|
import pytest
|
|
import litellm
|
|
from litellm import Router
|
|
from base_ocr_unit_tests import BaseOCRTest, TEST_PDF_URL
|
|
|
|
|
|
class TestMistralOCR(BaseOCRTest):
|
|
"""
|
|
Test class for Mistral OCR functionality.
|
|
"""
|
|
|
|
def get_base_ocr_call_args(self) -> dict:
|
|
"""Return the base OCR call args for Mistral"""
|
|
return {
|
|
"model": "mistral/mistral-ocr-latest",
|
|
"api_key": os.getenv("MISTRAL_API_KEY"),
|
|
}
|
|
|
|
@pytest.mark.asyncio
|
|
async def test_router_aocr_with_mistral():
|
|
"""
|
|
Test OCR with Router using Mistral OCR deployment.
|
|
"""
|
|
litellm.set_verbose = True
|
|
|
|
# Create router with Mistral OCR deployment
|
|
router = Router(
|
|
model_list=[
|
|
{
|
|
"model_name": "mistral-ocr",
|
|
"litellm_params": {
|
|
"model": "mistral/mistral-ocr-latest",
|
|
"api_key": os.getenv("MISTRAL_API_KEY"),
|
|
},
|
|
}
|
|
]
|
|
)
|
|
|
|
try:
|
|
# Call OCR through router
|
|
response = await router.aocr(
|
|
model="mistral-ocr",
|
|
document={
|
|
"type": "document_url",
|
|
"document_url": TEST_PDF_URL
|
|
},
|
|
)
|
|
|
|
print(f"\n{'='*80}")
|
|
print("Router OCR Test")
|
|
print(f"Response type: {type(response)}")
|
|
print(f"Response object: {response.object if hasattr(response, 'object') else 'N/A'}")
|
|
|
|
# Check if response has expected Mistral OCR format
|
|
assert hasattr(response, "pages"), "Response should have 'pages' attribute"
|
|
assert hasattr(response, "model"), "Response should have 'model' attribute"
|
|
assert hasattr(response, "object"), "Response should have 'object' attribute"
|
|
assert response.object == "ocr", f"Expected object='ocr', got '{response.object}'"
|
|
|
|
# Validate pages structure
|
|
assert isinstance(response.pages, list), "pages should be a list"
|
|
assert len(response.pages) > 0, "Should have at least one page"
|
|
|
|
# Check first page structure
|
|
first_page = response.pages[0]
|
|
assert hasattr(first_page, "index"), "Page should have 'index' attribute"
|
|
assert hasattr(first_page, "markdown"), "Page should have 'markdown' attribute"
|
|
|
|
# Extract text from all pages for validation
|
|
total_text = "\n\n".join(page.markdown for page in response.pages if page.markdown)
|
|
print(f"Total pages: {len(response.pages)}")
|
|
print(f"Total extracted text length: {len(total_text)} characters")
|
|
print(f"First 200 chars: {total_text[:200]}")
|
|
print(f"Model: {response.model}")
|
|
if response.usage_info:
|
|
print(f"Pages processed: {response.usage_info.pages_processed}")
|
|
print(f"{'='*80}\n")
|
|
|
|
assert len(total_text) > 0, "Should extract some text from the document"
|
|
|
|
except Exception as e:
|
|
pytest.fail(f"Router OCR call failed: {str(e)}")
|
|
|