@@ -213,8 +213,12 @@ async def test_gpt_oss_multi_turn_chat(gptoss_client: OpenAI,
213213
214214
# Full model identifier and a short alias for the same model; both are
# registered below as served base models.
MODEL_NAME = "openai-community/gpt2"
MODEL_NAME_SHORT = "gpt2"
CHAT_TEMPLATE = "Dummy chat template for testing {}"
# Each entry uses the same string for its served name and its model path.
# The full name is listed first, followed by the short alias.
BASE_MODEL_PATHS = [
    BaseModelPath(name=served_name, model_path=served_name)
    for served_name in (MODEL_NAME, MODEL_NAME_SHORT)
]
218222
219223
220224@dataclass
@@ -270,6 +274,42 @@ def test_async_serving_chat_init():
270274 assert serving_completion .chat_template == CHAT_TEMPLATE
271275
272276
@pytest.mark.asyncio
async def test_serving_chat_returns_correct_model_name():
    """Check the model name passed on by ``create_chat_completion``.

    ``chat_completion_full_generator`` is replaced with a stub that returns
    its fourth positional argument, so the awaited result of
    ``create_chat_completion`` is that argument. The test expects it to be
    the full ``MODEL_NAME`` when the request names the short alias, passes
    an empty string, or omits the model entirely.
    """
    engine = MagicMock(spec=MQLLMEngineClient)
    engine.errored = False
    engine.get_tokenizer.return_value = get_tokenizer(MODEL_NAME)

    serving_models = OpenAIServingModels(
        engine_client=engine,
        base_model_paths=BASE_MODEL_PATHS,
        model_config=MockModelConfig(),
    )
    serving_chat = OpenAIServingChat(
        engine,
        MockModelConfig(),
        serving_models,
        response_role="assistant",
        chat_template=CHAT_TEMPLATE,
        chat_template_content_format="auto",
        request_logger=None,
    )

    async def echo_fourth_arg(*call_args):
        # NOTE(review): index 3 is presumably the resolved model name in the
        # generator's positional arguments -- confirm against its signature.
        return call_args[3]

    serving_chat.chat_completion_full_generator = echo_fourth_arg

    messages = [{"role": "user", "content": "what is 1+1?"}]
    model_overrides = (
        {"model": MODEL_NAME_SHORT},  # short name is requested
        {"model": ""},  # empty string is specified
        {},  # no model is specified
    )
    # Every variant is expected to resolve to the full model name.
    for override in model_overrides:
        req = ChatCompletionRequest(messages=messages, **override)
        assert await serving_chat.create_chat_completion(req) == MODEL_NAME
311+
312+
273313@pytest .mark .asyncio
274314async def test_serving_chat_should_set_correct_max_tokens ():
275315 mock_engine = MagicMock (spec = MQLLMEngineClient )
0 commit comments