We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 2df2ff4, commit fe3814f (Copy full SHA for fe3814f)
vllm/entrypoints/openai/serving_chat.py
@@ -1003,15 +1003,7 @@ async def chat_completion_stream_generator(
1003
# handle tool calls after reasoning is done or when tool call
1004
# tokens are detected
1005
else:
1006
- # If entering here due to tool call detection, mark
1007
- # reasoning as ended and prepare state for tool parsing
1008
- if not reasoning_end_arr[i]:
1009
- reasoning_end_arr[i] = True
1010
- if not added_content_delta_arr[i]:
1011
- added_content_delta_arr[i] = True
1012
- previous_text = ""
1013
- previous_token_ids = []
1014
-
+ reasoning_end_arr[i] = True
1015
delta_token_ids = output_token_ids
1016
# First time to tool call,
1017
# add the remaining text and token ids
0 commit comments