mirror of
https://github.com/tiennm99/litellm.git
synced 2026-07-04 01:06:45 +00:00
Fix token_counter with special token input
This commit is contained in:
@@ -529,7 +529,7 @@ def _get_count_function(
             encoding = tiktoken.get_encoding("cl100k_base")
 
         def count_tokens(text: str) -> int:
-            return len(encoding.encode(text))
+            return len(encoding.encode(text, disallowed_special=()))
 
     else:
         raise ValueError("Unsupported tokenizer type")
@@ -451,6 +451,7 @@ def test_img_url_token_counter(img_url):
 
 def test_token_encode_disallowed_special():
     encode(model="gpt-3.5-turbo", text="Hello, world! <|endoftext|>")
+    token_counter(model="gpt-3.5-turbo", text="Hello, world! <|endoftext|>")
 
 
 def test_token_counter():
Reference in New Issue
Block a user