fix: remove max_tokens from az ai client create call when stream=True (#5860)

This commit is contained in:
Eric Zhu 2025-03-06 17:18:37 -08:00 committed by GitHub
parent 05b14f197a
commit ea89a84c30
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -404,9 +404,7 @@ class AzureAIChatCompletionClient(ChatCompletionClient):
self._client.complete(messages=azure_messages, tools=converted_tools, stream=True, **create_args)
)
else:
-task = asyncio.create_task(
-self._client.complete(messages=azure_messages, max_tokens=20, stream=True, **create_args)
-)
+task = asyncio.create_task(self._client.complete(messages=azure_messages, stream=True, **create_args))
if cancellation_token is not None:
cancellation_token.link_future(task)