import unittest
from fastdeploy.entrypoints.openai.protocol import ChatCompletionRequest
from fastdeploy.reasoning.qwen3_reasoning_parsers import Qwen3ReasoningParser
class MockTokenizer:
"""Minimal tokenizer with vocab for testing."""
def __init__(self):
self.vocab = {
"": 100,
"": 101,
}
def get_vocab(self):
"""Return vocab dict for testing."""
return self.vocab
class MissingTokenTokenizer:
def __init__(self):
self.vocab = {
"": 100,
}
def get_vocab(self):
"""Return vocab dict for testing."""
return self.vocab
class TestQwen3ReasoningParser(unittest.TestCase):
def setUp(self):
self.parser = Qwen3ReasoningParser(MockTokenizer())
self.request = ChatCompletionRequest(model="test", messages=[{"role": "user", "content": "test message"}])
self.tokenizer = MockTokenizer()
def test_missing_token(self):
with self.assertRaises(RuntimeError) as context:
Qwen3ReasoningParser(MissingTokenTokenizer())
exception_message = str(context.exception)
expected_message_part = "Qwen3 reasoning parser could not find the following token ids"
self.assertIn(expected_message_part, exception_message)
def test_get_model_status(self):
status = self.parser.get_model_status([1, 2, 100])
self.assertEqual(status, "think_start")
status = self.parser.get_model_status([1, 2, 101])
self.assertEqual(status, "think_end")
status = self.parser.get_model_status([1])
self.assertEqual(status, "think_start")
def test_streaming_thinking_content(self):
msg = self.parser.extract_reasoning_content_streaming(
previous_text="",
current_text="a",
delta_text="a",
previous_token_ids=[],
current_token_ids=[],
delta_token_ids=[200],
model_status="think_start",
)
self.assertEqual(msg.reasoning_content, "a")
msg = self.parser.extract_reasoning_content_streaming(
previous_text="",
current_text="ab",
delta_text="ab",
previous_token_ids=[],
current_token_ids=[],
delta_token_ids=[99, 101, 102],
model_status="think_start",
)
self.assertEqual(msg.reasoning_content, "a")
self.assertEqual(msg.content, "b")
msg = self.parser.extract_reasoning_content_streaming(
previous_text="a",
current_text="ab",
delta_text="b",
previous_token_ids=[1, 101],
current_token_ids=[],
delta_token_ids=[102],
model_status="think_start",
)
self.assertEqual(msg.content, "b")
msg = self.parser.extract_reasoning_content_streaming(
previous_text="",
current_text="a",
delta_text="a",
previous_token_ids=[],
current_token_ids=[],
delta_token_ids=[],
model_status="think_start",
)
self.assertEqual(msg.reasoning_content, "a")
msg = self.parser.extract_reasoning_content_streaming(
previous_text="",
current_text="a",
delta_text="a",
previous_token_ids=[],
current_token_ids=[],
delta_token_ids=[200],
model_status="think_end",
)
self.assertEqual(msg.content, "a")
msg = self.parser.extract_reasoning_content_streaming(
previous_text="hello",
current_text="hellohi",
delta_text="hi",
previous_token_ids=[],
current_token_ids=[],
delta_token_ids=[101, 200],
model_status="think_start",
)
self.assertEqual(msg.content, "hi")
self.assertEqual(msg.reasoning_content, "")
msg = self.parser.extract_reasoning_content_streaming(
previous_text="hello",
current_text="hellohi",
delta_text="hi",
previous_token_ids=[100],
current_token_ids=[],
delta_token_ids=[],
model_status="think_start",
)
self.assertEqual(msg.content, None)
self.assertEqual(msg.reasoning_content, "hi")
msg = self.parser.extract_reasoning_content_streaming(
previous_text="hello",
current_text="hellohi",
delta_text="hi",
previous_token_ids=[],
current_token_ids=[],
delta_token_ids=[100, 200],
model_status="think_start",
)
self.assertEqual(msg.content, "")
self.assertEqual(msg.reasoning_content, "hi")
def test_none_streaming_thinking_content(self):
reasoning_content, content = self.parser.extract_reasoning_content(
model_output="a",
request={},
model_status="think_start",
)
self.assertEqual(reasoning_content, None)
self.assertEqual(content, "a")
reasoning_content, content = self.parser.extract_reasoning_content(
model_output="ab",
request={},
model_status="think_start",
)
self.assertEqual(reasoning_content, "a")
self.assertEqual(content, "b")
reasoning_content, content = self.parser.extract_reasoning_content(
model_output="a",
request={},
model_status="think_end",
)
self.assertEqual(reasoning_content, None)
self.assertEqual(content, "a")
reasoning_content, content = self.parser.extract_reasoning_content(
model_output="a",
request={},
model_status="think_start",
)
self.assertEqual(reasoning_content, None)
self.assertEqual(content, "a")
reasoning_content, content = self.parser.extract_reasoning_content(
model_output="ab",
request={},
model_status="think_start",
)
self.assertEqual(reasoning_content, "a")
self.assertEqual(content, "b")
reasoning_content, content = self.parser.extract_reasoning_content(
model_output="b",
request={},
model_status="think_start",
)
self.assertEqual(reasoning_content, "")
self.assertEqual(content, "b")
if __name__ == "__main__":
unittest.main()