Upload 4 files
Browse files- config.json +4 -5
- generation_config.json +0 -2
- qwen3_xml_tool_parser.py +675 -0
    	
        config.json
    CHANGED
    
    | @@ -1,9 +1,8 @@ | |
| 1 | 
             
            {
         | 
| 2 | 
             
              "architectures": [
         | 
| 3 | 
            -
                " | 
| 4 | 
             
              ],
         | 
| 5 | 
             
              "attention_dropout": 0.0,
         | 
| 6 | 
            -
              "bos_token_id": 151643,
         | 
| 7 | 
             
              "decoder_sparse_step": 1,
         | 
| 8 | 
             
              "eos_token_id": 151645,
         | 
| 9 | 
             
              "head_dim": 128,
         | 
| @@ -12,9 +11,9 @@ | |
| 12 | 
             
              "initializer_range": 0.02,
         | 
| 13 | 
             
              "intermediate_size": 8192,
         | 
| 14 | 
             
              "max_position_embeddings": 262144,
         | 
| 15 | 
            -
              "max_window_layers":  | 
| 16 | 
             
              "mlp_only_layers": [],
         | 
| 17 | 
            -
              "model_type": " | 
| 18 | 
             
              "moe_intermediate_size": 2560,
         | 
| 19 | 
             
              "norm_topk_prob": true,
         | 
| 20 | 
             
              "num_attention_heads": 96,
         | 
| @@ -32,7 +31,7 @@ | |
| 32 | 
             
              "sliding_window": null,
         | 
| 33 | 
             
              "tie_word_embeddings": false,
         | 
| 34 | 
             
              "torch_dtype": "bfloat16",
         | 
| 35 | 
            -
              "transformers_version": "4. | 
| 36 | 
             
              "use_cache": true,
         | 
| 37 | 
             
              "use_qk_norm": true,
         | 
| 38 | 
             
              "use_sliding_window": false,
         | 
|  | |
| 1 | 
             
            {
         | 
| 2 | 
             
              "architectures": [
         | 
| 3 | 
            +
                "Qwen3MoeForCausalLM"
         | 
| 4 | 
             
              ],
         | 
| 5 | 
             
              "attention_dropout": 0.0,
         | 
|  | |
| 6 | 
             
              "decoder_sparse_step": 1,
         | 
| 7 | 
             
              "eos_token_id": 151645,
         | 
| 8 | 
             
              "head_dim": 128,
         | 
|  | |
| 11 | 
             
              "initializer_range": 0.02,
         | 
| 12 | 
             
              "intermediate_size": 8192,
         | 
| 13 | 
             
              "max_position_embeddings": 262144,
         | 
| 14 | 
            +
              "max_window_layers": 62,
         | 
| 15 | 
             
              "mlp_only_layers": [],
         | 
| 16 | 
            +
              "model_type": "qwen3_moe",
         | 
| 17 | 
             
              "moe_intermediate_size": 2560,
         | 
| 18 | 
             
              "norm_topk_prob": true,
         | 
| 19 | 
             
              "num_attention_heads": 96,
         | 
|  | |
| 31 | 
             
              "sliding_window": null,
         | 
| 32 | 
             
              "tie_word_embeddings": false,
         | 
| 33 | 
             
              "torch_dtype": "bfloat16",
         | 
| 34 | 
            +
              "transformers_version": "4.51.0",
         | 
| 35 | 
             
              "use_cache": true,
         | 
| 36 | 
             
              "use_qk_norm": true,
         | 
| 37 | 
             
              "use_sliding_window": false,
         | 
    	
        generation_config.json
    CHANGED
    
    | @@ -1,5 +1,4 @@ | |
| 1 | 
             
            {
         | 
| 2 | 
            -
              "bos_token_id": 151643,
         | 
| 3 | 
             
              "pad_token_id": 151643,
         | 
| 4 | 
             
              "do_sample": true,
         | 
| 5 | 
             
              "eos_token_id": [
         | 
| @@ -7,7 +6,6 @@ | |
| 7 | 
             
                151643
         | 
| 8 | 
             
              ],
         | 
| 9 | 
             
              "repetition_penalty": 1.05,
         | 
| 10 | 
            -
              "presence_penalty": 0.0,
         | 
| 11 | 
             
              "temperature": 0.7,
         | 
| 12 | 
             
              "top_p": 0.8,
         | 
| 13 | 
             
              "top_k": 20
         | 
|  | |
| 1 | 
             
            {
         | 
|  | |
| 2 | 
             
              "pad_token_id": 151643,
         | 
| 3 | 
             
              "do_sample": true,
         | 
| 4 | 
             
              "eos_token_id": [
         | 
|  | |
| 6 | 
             
                151643
         | 
| 7 | 
             
              ],
         | 
| 8 | 
             
              "repetition_penalty": 1.05,
         | 
|  | |
| 9 | 
             
              "temperature": 0.7,
         | 
| 10 | 
             
              "top_p": 0.8,
         | 
| 11 | 
             
              "top_k": 20
         | 
    	
        qwen3_xml_tool_parser.py
    ADDED
    
    | @@ -0,0 +1,675 @@ | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            # SPDX-License-Identifier: Apache-2.0
         | 
| 2 | 
            +
             | 
| 3 | 
            +
            import json
         | 
| 4 | 
            +
            import re
         | 
| 5 | 
            +
            import uuid
         | 
| 6 | 
            +
            from collections.abc import Sequence
         | 
| 7 | 
            +
            from typing import Union, Optional, Any, List, Dict
         | 
| 8 | 
            +
            from enum import Enum
         | 
| 9 | 
            +
             | 
| 10 | 
            +
            from vllm.entrypoints.openai.protocol import (
         | 
| 11 | 
            +
                ChatCompletionRequest,
         | 
| 12 | 
            +
                ChatCompletionToolsParam,
         | 
| 13 | 
            +
                DeltaMessage,
         | 
| 14 | 
            +
                DeltaToolCall,
         | 
| 15 | 
            +
                DeltaFunctionCall,
         | 
| 16 | 
            +
                ExtractedToolCallInformation,
         | 
| 17 | 
            +
                FunctionCall,
         | 
| 18 | 
            +
                ToolCall,
         | 
| 19 | 
            +
            )
         | 
| 20 | 
            +
            from vllm.entrypoints.openai.tool_parsers.abstract_tool_parser import (
         | 
| 21 | 
            +
                ToolParser,
         | 
| 22 | 
            +
                ToolParserManager,
         | 
| 23 | 
            +
            )
         | 
| 24 | 
            +
            from vllm.logger import init_logger
         | 
| 25 | 
            +
            from vllm.transformers_utils.tokenizer import AnyTokenizer
         | 
| 26 | 
            +
             | 
| 27 | 
            +
            logger = init_logger(__name__)
         | 
| 28 | 
            +
             | 
| 29 | 
            +
             | 
| 30 | 
            +
            @ToolParserManager.register_module("qwen3_xml")
         | 
| 31 | 
            +
            class Qwen3XMLToolParser(ToolParser):
         | 
| 32 | 
            +
                def __init__(self, tokenizer: AnyTokenizer):
                    """Initialise tag constants, streaming state, regexes and sentinel token ids.

                    Args:
                        tokenizer: Tokenizer forwarded unchanged to the ``ToolParser`` base class.

                    Raises:
                        ValueError: If ``self.model_tokenizer`` is falsy after base-class setup.
                        RuntimeError: If ``<tool_call>`` or ``</tool_call>`` is missing from
                            ``self.vocab``.
                    """
                    super().__init__(tokenizer)

                    # Fail fast when there is no tokenizer to resolve the sentinel ids against.
                    if not self.model_tokenizer:
                        raise ValueError(
                            "The model tokenizer must be passed to the ToolParser "
                            "constructor during construction."
                        )

                    # Tool-call bookkeeping fields.
                    self.current_tool_name_sent: bool = False
                    self.prev_tool_call_arr: list[dict] = []
                    self.current_tool_id: int = -1
                    self.streamed_args_for_tool: list[str] = []

                    # Literal XML-style tags that delimit a tool call in the model output.
                    self.tool_call_start_token: str = "<tool_call>"
                    self.tool_call_end_token: str = "</tool_call>"
                    self.tool_call_prefix: str = "<function="
                    self.function_end_token: str = "</function>"
                    self.parameter_prefix: str = "<parameter="
                    self.parameter_end_token: str = "</parameter>"
                    self.is_tool_call_started: bool = False
                    self.failed_count: int = 0

                    # NOTE: this runs after the assignments above on purpose; it overwrites
                    # ``current_tool_id`` (with None) and ``is_tool_call_started``.
                    self._reset_streaming_state()

                    # Every pattern lets "." span newlines. Apart from the first, each also has
                    # a second alternative that accepts an unterminated element running to the
                    # end of the text.
                    flags = re.DOTALL
                    self.tool_call_complete_regex = re.compile(
                        r"<tool_call>(.*?)</tool_call>", flags
                    )
                    self.tool_call_regex = re.compile(
                        r"<tool_call>(.*?)</tool_call>|<tool_call>(.*?)$", flags
                    )
                    self.tool_call_function_regex = re.compile(
                        r"<function=(.*?)</function>|<function=(.*)$", flags
                    )
                    self.tool_call_parameter_regex = re.compile(
                        r"<parameter=(.*?)</parameter>|<parameter=(.*?)$", flags
                    )

                    # Resolve the sentinel tags to vocabulary ids; both must be present.
                    start_id = self.vocab.get(self.tool_call_start_token)
                    end_id = self.vocab.get(self.tool_call_end_token)
                    self.tool_call_start_token_id = start_id
                    self.tool_call_end_token_id = end_id

                    if start_id is None or end_id is None:
                        raise RuntimeError(
                            "Qwen3 XML Tool parser could not locate tool call start/end "
                            "tokens in the tokenizer!"
                        )

                    logger.info(f"vLLM Successfully import tool parser {self.__class__.__name__} !")
         | 
| 83 | 
            +
             | 
| 84 | 
            +
                def _generate_tool_call_id(self) -> str:
         | 
| 85 | 
            +
                    """Generate a unique tool call ID."""
         | 
| 86 | 
            +
                    return f"call_{uuid.uuid4().hex[:24]}"
         | 
| 87 | 
            +
             | 
| 88 | 
            +
                def _reset_streaming_state(self):
         | 
| 89 | 
            +
                    """Reset all streaming state."""
         | 
| 90 | 
            +
                    self.current_tool_index = 0
         | 
| 91 | 
            +
                    self.is_tool_call_started = False
         | 
| 92 | 
            +
                    self.header_sent = False
         | 
| 93 | 
            +
                    self.current_tool_id = None
         | 
| 94 | 
            +
                    self.current_function_name = None
         | 
| 95 | 
            +
                    self.current_param_name = None
         | 
| 96 | 
            +
                    self.current_param_value = ""
         | 
| 97 | 
            +
                    self.param_count = 0
         | 
| 98 | 
            +
                    self.in_param = False
         | 
| 99 | 
            +
                    self.in_function = False
         | 
| 100 | 
            +
                    self.accumulated_text = ""
         | 
| 101 | 
            +
                    self.json_started = False
         | 
| 102 | 
            +
                    self.json_closed = False
         | 
| 103 | 
            +
             | 
| 104 | 
            +
                def _parse_xml_function_call(
                    self, function_call_str: str, tools: Optional[list[ChatCompletionToolsParam]]
                ) -> Optional[ToolCall]:
                    """Parse one ``NAME>...<parameter=KEY>VALUE</parameter>...`` payload.

                    ``function_call_str`` is the text that follows ``<function=`` (as captured
                    by ``self.tool_call_function_regex``): the function name, a ``>``, then
                    zero or more parameter elements. Each parameter value is coerced
                    according to the type declared for it in ``tools``; undeclared
                    parameters are kept as strings.

                    Args:
                        function_call_str: Raw function-call text starting at the function name.
                        tools: Tool definitions used to look up declared parameter types, or
                            ``None`` when no schema is available.

                    Returns:
                        A ``ToolCall`` of type ``"function"`` whose ``arguments`` is the
                        JSON-encoded dict of converted parameters.

                    Raises:
                        ValueError: If the function header or a parameter header contains no
                            ``>`` (raised by ``str.index``).
                        TypeError: If a converted value is not JSON serialisable (raised by
                            ``json.dumps``).
                    """
                    # Local import keeps this block self-contained; ``ast`` is only needed
                    # for the literal-parsing fallback below.
                    import ast

                    def get_arguments_config(func_name: str) -> dict:
                        """Return the declared parameter schema for ``func_name`` ({} if unknown)."""
                        if tools is None:
                            return {}
                        for config in tools:
                            if not hasattr(config, "type") or not (
                                hasattr(config, "function") and hasattr(config.function, "name")
                            ):
                                continue
                            if config.type == "function" and config.function.name == func_name:
                                params = getattr(config.function, "parameters", None)
                                if not isinstance(params, dict):
                                    return {}
                                if "properties" in params:
                                    properties = params["properties"]
                                    # A malformed (non-dict) "properties" entry is treated as
                                    # "no schema" instead of crashing the lookups further down.
                                    return properties if isinstance(properties, dict) else {}
                                return params
                        logger.warning("Tool '%s' is not defined in the tools list.", func_name)
                        return {}

                    def convert_param_value(
                        param_value: str, param_name: str, param_config: dict, func_name: str
                    ) -> Any:
                        """Coerce ``param_value`` to the type declared for ``param_name``."""
                        # A literal "null" (any casing) maps to None regardless of declared type.
                        if param_value.lower() == "null":
                            return None

                        if param_name not in param_config:
                            if param_config != {}:
                                logger.warning(
                                    "Parsed parameter '%s' is not defined in the tool "
                                    "parameters for tool '%s', directly returning the string value.",
                                    param_name,
                                    func_name,
                                )
                            return param_value

                        spec = param_config[param_name]
                        if isinstance(spec, dict) and "type" in spec:
                            param_type = str(spec["type"]).strip().lower()
                        else:
                            param_type = "string"

                        if param_type in ["string", "str", "text", "varchar", "char", "enum"]:
                            return param_value

                        if param_type.startswith(("int", "uint", "long", "short", "unsigned")):
                            try:
                                return int(param_value)
                            except (ValueError, TypeError):
                                logger.warning(
                                    "Parsed value '%s' of parameter '%s' is not an integer in tool "
                                    "'%s', degenerating to string.",
                                    param_value,
                                    param_name,
                                    func_name,
                                )
                                return param_value

                        if param_type.startswith(("num", "float")):
                            try:
                                float_param_value = float(param_value)
                                # Whole numbers are returned as int. int() raises for
                                # inf/nan, which deliberately falls back to the raw string.
                                if float_param_value - int(float_param_value) != 0:
                                    return float_param_value
                                return int(float_param_value)
                            except (ValueError, TypeError, OverflowError):
                                logger.warning(
                                    "Parsed value '%s' of parameter '%s' is not a float in tool "
                                    "'%s', degenerating to string.",
                                    param_value,
                                    param_name,
                                    func_name,
                                )
                                return param_value

                        if param_type in ["boolean", "bool", "binary"]:
                            lowered = param_value.lower()
                            if lowered not in ["true", "false"]:
                                logger.warning(
                                    "Parsed value '%s' of parameter '%s' is not a boolean "
                                    "(`true` of `false`) in tool '%s', degenerating to false.",
                                    lowered,
                                    param_name,
                                    func_name,
                                )
                            return lowered == "true"

                        # Remaining types (object, array, ...): try JSON first for
                        # object-like types, then fall back to a Python literal.
                        if param_type == "object" or param_type.startswith("dict"):
                            try:
                                return json.loads(param_value)
                            except (ValueError, TypeError, RecursionError):
                                logger.warning(
                                    "Parsed value '%s' of parameter '%s' is not a valid JSON object "
                                    "in tool '%s', will try other methods to parse it.",
                                    param_value,
                                    param_name,
                                    func_name,
                                )
                        try:
                            # SECURITY: the value is model-generated text. The original code
                            # passed it to eval(), which can execute arbitrary code.
                            # ast.literal_eval only accepts Python literals (numbers,
                            # strings, lists, dicts, tuples, sets, booleans, None).
                            return ast.literal_eval(param_value)
                        except (ValueError, SyntaxError, TypeError, MemoryError, RecursionError):
                            logger.warning(
                                "Parsed value '%s' of parameter '%s' cannot be converted via "
                                "Python `ast.literal_eval()` in tool '%s', degenerating to string.",
                                param_value,
                                param_name,
                                func_name,
                            )
                            return param_value

                    # The function name is everything before the first ">".
                    end_index = function_call_str.index(">")
                    function_name = function_call_str[:end_index]
                    param_config = get_arguments_config(function_name)
                    parameters = function_call_str[end_index + 1 :]

                    param_dict = {}
                    for closed, unclosed in self.tool_call_parameter_regex.findall(parameters):
                        # Prefer the properly closed element; otherwise use the unterminated one.
                        match_text = closed if closed else unclosed
                        idx = match_text.index(">")
                        param_name = match_text[:idx]
                        param_value = str(match_text[idx + 1 :])
                        # Drop exactly one leading and one trailing newline around the value.
                        if param_value.startswith("\n"):
                            param_value = param_value[1:]
                        if param_value.endswith("\n"):
                            param_value = param_value[:-1]

                        param_dict[param_name] = convert_param_value(
                            param_value, param_name, param_config, function_name
                        )

                    return ToolCall(
                        type="function",
                        function=FunctionCall(
                            name=function_name, arguments=json.dumps(param_dict, ensure_ascii=False)
                        ),
                    )
         | 
| 228 | 
            +
             | 
| 229 | 
            +
                def _get_function_calls(self, model_output: str) -> List[str]:
         | 
| 230 | 
            +
                    # Find all tool calls
         | 
| 231 | 
            +
                    matched_ranges = self.tool_call_regex.findall(model_output)
         | 
| 232 | 
            +
                    raw_tool_calls = [
         | 
| 233 | 
            +
                        match[0] if match[0] else match[1] for match in matched_ranges
         | 
| 234 | 
            +
                    ]
         | 
| 235 | 
            +
             | 
| 236 | 
            +
                    # Back-off strategy if no tool_call tags found
         | 
| 237 | 
            +
                    if len(raw_tool_calls) == 0:
         | 
| 238 | 
            +
                        raw_tool_calls = [model_output]
         | 
| 239 | 
            +
             | 
| 240 | 
            +
                    raw_function_calls = []
         | 
| 241 | 
            +
                    for tool_call in raw_tool_calls:
         | 
| 242 | 
            +
                        raw_function_calls.extend(self.tool_call_function_regex.findall(tool_call))
         | 
| 243 | 
            +
             | 
| 244 | 
            +
                    function_calls = [
         | 
| 245 | 
            +
                        match[0] if match[0] else match[1] for match in raw_function_calls
         | 
| 246 | 
            +
                    ]
         | 
| 247 | 
            +
                    return function_calls
         | 
| 248 | 
            +
             | 
| 249 | 
            +
                def extract_tool_calls(
                    self,
                    model_output: str,
                    request: ChatCompletionRequest,
                ) -> ExtractedToolCallInformation:
                    """Extract tool calls from a complete (non-streaming) model response.

                    Args:
                        model_output: The full text produced by the model.
                        request: The originating chat request; its ``tools`` are handed
                            to ``_parse_xml_function_call`` for every call found.

                    Returns:
                        An ``ExtractedToolCallInformation``. When function calls are
                        found, it carries the parsed calls plus whatever text precedes
                        the first tool-call marker (``None`` if that text is empty).
                        When the function prefix is absent, no calls are found, or any
                        step raises, the untouched ``model_output`` is returned as
                        content with ``tools_called=False``.
                    """
                    # Cheap substring test first: without the function prefix there is
                    # nothing to parse.
                    if self.tool_call_prefix not in model_output:
                        return ExtractedToolCallInformation(
                            tools_called=False, tool_calls=[], content=model_output
                        )

                    try:
                        call_strings = self._get_function_calls(model_output)
                        if not call_strings:
                            return ExtractedToolCallInformation(
                                tools_called=False, tool_calls=[], content=model_output
                            )

                        # At least one call string exists here, so reading
                        # request.tools once is equivalent to reading it per call.
                        available_tools = request.tools
                        tool_calls = [
                            self._parse_xml_function_call(call_str, available_tools)
                            for call_str in call_strings
                        ]

                        # Rebuild prev_tool_call_arr so the serving layer can set
                        # finish_reason; falsy parse results are not recorded.
                        self.prev_tool_call_arr.clear()
                        for parsed_call in tool_calls:
                            if not parsed_call:
                                continue
                            self.prev_tool_call_arr.append(
                                {
                                    "name": parsed_call.function.name,
                                    "arguments": parsed_call.function.arguments,
                                }
                            )

                        # Plain content is everything before the first tool-call start
                        # token; if that token is missing, fall back to the position of
                        # the function prefix (known to be present from the check above).
                        cut_at = model_output.find(self.tool_call_start_token)
                        if cut_at < 0:
                            cut_at = model_output.find(self.tool_call_prefix)
                        leading_text = model_output[:cut_at]

                        return ExtractedToolCallInformation(
                            tools_called=bool(tool_calls),
                            tool_calls=tool_calls,
                            content=leading_text or None,
                        )

                    except Exception:
                        # Best-effort boundary: log the failure and hand the raw text
                        # back as ordinary content.
                        logger.exception("Error in extracting tool call from response.")
                        return ExtractedToolCallInformation(
                            tools_called=False, tool_calls=[], content=model_output
                        )
         | 
| 303 | 
            +
             | 
| 304 | 
            +
                def extract_tool_calls_streaming(
         | 
| 305 | 
            +
                    self,
         | 
| 306 | 
            +
                    previous_text: str,
         | 
| 307 | 
            +
                    current_text: str,
         | 
| 308 | 
            +
                    delta_text: str,
         | 
| 309 | 
            +
                    previous_token_ids: Sequence[int],
         | 
| 310 | 
            +
                    current_token_ids: Sequence[int],
         | 
| 311 | 
            +
                    delta_token_ids: Sequence[int],
         | 
| 312 | 
            +
                    request: ChatCompletionRequest,
         | 
| 313 | 
            +
                ) -> Union[DeltaMessage, None]:
         | 
| 314 | 
            +
                    # If no delta text, return None unless it's an EOS token after tool calls
         | 
| 315 | 
            +
                    if not delta_text:
         | 
| 316 | 
            +
                        # Check if this is an EOS token after all tool calls are complete
         | 
| 317 | 
            +
                        # We check for tool calls in the text even if is_tool_call_started is False
         | 
| 318 | 
            +
                        # because it might have been reset after processing all tools
         | 
| 319 | 
            +
                        if delta_token_ids and self.tool_call_end_token_id not in delta_token_ids:
         | 
| 320 | 
            +
                            # Count complete tool calls
         | 
| 321 | 
            +
                            complete_calls = len(
         | 
| 322 | 
            +
                                self.tool_call_complete_regex.findall(current_text)
         | 
| 323 | 
            +
                            )
         | 
| 324 | 
            +
             | 
| 325 | 
            +
                            # If we have completed tool calls and populated prev_tool_call_arr
         | 
| 326 | 
            +
                            if complete_calls > 0 and len(self.prev_tool_call_arr) > 0:
         | 
| 327 | 
            +
                                # Check if all tool calls are closed
         | 
| 328 | 
            +
                                open_calls = current_text.count(
         | 
| 329 | 
            +
                                    self.tool_call_start_token
         | 
| 330 | 
            +
                                ) - current_text.count(self.tool_call_end_token)
         | 
| 331 | 
            +
                                if open_calls == 0:
         | 
| 332 | 
            +
                                    # Return empty delta message to allow finish_reason processing
         | 
| 333 | 
            +
                                    return DeltaMessage(content="")
         | 
| 334 | 
            +
                            elif not self.is_tool_call_started and current_text:
         | 
| 335 | 
            +
                                # This is a regular content response that's now complete
         | 
| 336 | 
            +
                                return DeltaMessage(content="")
         | 
| 337 | 
            +
                        return None
         | 
| 338 | 
            +
             | 
| 339 | 
            +
                    # Check if this is the first call (reset state if needed)
         | 
| 340 | 
            +
                    if not previous_text:
         | 
| 341 | 
            +
                        self._reset_streaming_state()
         | 
| 342 | 
            +
             | 
| 343 | 
            +
                    # Update accumulated text
         | 
| 344 | 
            +
                    self.accumulated_text = current_text
         | 
| 345 | 
            +
             | 
| 346 | 
            +
                    # Check if we need to advance to next tool
         | 
| 347 | 
            +
                    if self.json_closed and not self.in_function:
         | 
| 348 | 
            +
                        # Check if this tool call has ended
         | 
| 349 | 
            +
                        tool_ends = current_text.count(self.tool_call_end_token)
         | 
| 350 | 
            +
                        if tool_ends > self.current_tool_index:
         | 
| 351 | 
            +
                            # This tool has ended, advance to next
         | 
| 352 | 
            +
                            self.current_tool_index += 1
         | 
| 353 | 
            +
                            self.header_sent = False
         | 
| 354 | 
            +
                            self.param_count = 0
         | 
| 355 | 
            +
                            self.json_started = False
         | 
| 356 | 
            +
                            self.json_closed = False
         | 
| 357 | 
            +
             | 
| 358 | 
            +
                            # Check if there are more tool calls
         | 
| 359 | 
            +
                            tool_starts = current_text.count(self.tool_call_start_token)
         | 
| 360 | 
            +
                            if self.current_tool_index >= tool_starts:
         | 
| 361 | 
            +
                                # No more tool calls
         | 
| 362 | 
            +
                                self.is_tool_call_started = False
         | 
| 363 | 
            +
                            # Continue processing next tool
         | 
| 364 | 
            +
                            return None
         | 
| 365 | 
            +
             | 
| 366 | 
            +
                    # Handle normal content before tool calls
         | 
| 367 | 
            +
                    if not self.is_tool_call_started:
         | 
| 368 | 
            +
                        # Check if tool call is starting
         | 
| 369 | 
            +
                        if (
         | 
| 370 | 
            +
                            self.tool_call_start_token_id in delta_token_ids
         | 
| 371 | 
            +
                            or self.tool_call_start_token in delta_text
         | 
| 372 | 
            +
                        ):
         | 
| 373 | 
            +
                            self.is_tool_call_started = True
         | 
| 374 | 
            +
                            # Return any content before the tool call
         | 
| 375 | 
            +
                            if self.tool_call_start_token in delta_text:
         | 
| 376 | 
            +
                                content_before = delta_text[
         | 
| 377 | 
            +
                                    : delta_text.index(self.tool_call_start_token)
         | 
| 378 | 
            +
                                ]
         | 
| 379 | 
            +
                                if content_before:
         | 
| 380 | 
            +
                                    return DeltaMessage(content=content_before)
         | 
| 381 | 
            +
                            return None
         | 
| 382 | 
            +
                        else:
         | 
| 383 | 
            +
                            # Check if we're between tool calls - skip whitespace
         | 
| 384 | 
            +
                            if current_text.rstrip().endswith(self.tool_call_end_token):
         | 
| 385 | 
            +
                                # We just ended a tool call, skip whitespace
         | 
| 386 | 
            +
                                if delta_text.strip() == "":
         | 
| 387 | 
            +
                                    return None
         | 
| 388 | 
            +
                            # Normal content, no tool call
         | 
| 389 | 
            +
                            return DeltaMessage(content=delta_text)
         | 
| 390 | 
            +
             | 
| 391 | 
            +
                    # Check if we're between tool calls (waiting for next one)
         | 
| 392 | 
            +
                    # Count tool calls we've seen vs processed
         | 
| 393 | 
            +
                    tool_starts_count = current_text.count(self.tool_call_start_token)
         | 
| 394 | 
            +
                    if self.current_tool_index >= tool_starts_count:
         | 
| 395 | 
            +
                        # We're past all tool calls, shouldn't be here
         | 
| 396 | 
            +
                        return None
         | 
| 397 | 
            +
             | 
| 398 | 
            +
                    # We're in a tool call, find the current tool call portion
         | 
| 399 | 
            +
                    # Need to find the correct tool call based on current_tool_index
         | 
| 400 | 
            +
                    tool_starts = []
         | 
| 401 | 
            +
                    idx = 0
         | 
| 402 | 
            +
                    while True:
         | 
| 403 | 
            +
                        idx = current_text.find(self.tool_call_start_token, idx)
         | 
| 404 | 
            +
                        if idx == -1:
         | 
| 405 | 
            +
                            break
         | 
| 406 | 
            +
                        tool_starts.append(idx)
         | 
| 407 | 
            +
                        idx += len(self.tool_call_start_token)
         | 
| 408 | 
            +
             | 
| 409 | 
            +
                    if self.current_tool_index >= len(tool_starts):
         | 
| 410 | 
            +
                        # No more tool calls to process yet
         | 
| 411 | 
            +
                        return None
         | 
| 412 | 
            +
             | 
| 413 | 
            +
                    tool_start_idx = tool_starts[self.current_tool_index]
         | 
| 414 | 
            +
                    # Find where this tool call ends (or current position if not ended yet)
         | 
| 415 | 
            +
                    tool_end_idx = current_text.find(self.tool_call_end_token, tool_start_idx)
         | 
| 416 | 
            +
                    if tool_end_idx == -1:
         | 
| 417 | 
            +
                        tool_text = current_text[tool_start_idx:]
         | 
| 418 | 
            +
                    else:
         | 
| 419 | 
            +
                        tool_text = current_text[
         | 
| 420 | 
            +
                            tool_start_idx : tool_end_idx + len(self.tool_call_end_token)
         | 
| 421 | 
            +
                        ]
         | 
| 422 | 
            +
             | 
| 423 | 
            +
                    # Looking for function header
         | 
| 424 | 
            +
                    if not self.header_sent:
         | 
| 425 | 
            +
                        if self.tool_call_prefix in tool_text:
         | 
| 426 | 
            +
                            func_start = tool_text.find(self.tool_call_prefix) + len(
         | 
| 427 | 
            +
                                self.tool_call_prefix
         | 
| 428 | 
            +
                            )
         | 
| 429 | 
            +
                            func_end = tool_text.find(">", func_start)
         | 
| 430 | 
            +
             | 
| 431 | 
            +
                            if func_end != -1:
         | 
| 432 | 
            +
                                # Found complete function name
         | 
| 433 | 
            +
                                self.current_function_name = tool_text[func_start:func_end]
         | 
| 434 | 
            +
                                self.current_tool_id = self._generate_tool_call_id()
         | 
| 435 | 
            +
                                self.header_sent = True
         | 
| 436 | 
            +
                                self.in_function = True
         | 
| 437 | 
            +
             | 
| 438 | 
            +
                                # IMPORTANT: Add to prev_tool_call_arr immediately when we detect a tool call
         | 
| 439 | 
            +
                                # This ensures finish_reason="tool_calls" even if parsing isn't complete
         | 
| 440 | 
            +
                                already_added = any(
         | 
| 441 | 
            +
                                    tool.get("name") == self.current_function_name
         | 
| 442 | 
            +
                                    for tool in self.prev_tool_call_arr
         | 
| 443 | 
            +
                                )
         | 
| 444 | 
            +
                                if not already_added:
         | 
| 445 | 
            +
                                    self.prev_tool_call_arr.append(
         | 
| 446 | 
            +
                                        {
         | 
| 447 | 
            +
                                            "name": self.current_function_name,
         | 
| 448 | 
            +
                                            "arguments": "{}",  # Placeholder, will be updated later
         | 
| 449 | 
            +
                                        }
         | 
| 450 | 
            +
                                    )
         | 
| 451 | 
            +
             | 
| 452 | 
            +
                                # Send header with function info
         | 
| 453 | 
            +
                                return DeltaMessage(
         | 
| 454 | 
            +
                                    tool_calls=[
         | 
| 455 | 
            +
                                        DeltaToolCall(
         | 
| 456 | 
            +
                                            index=self.current_tool_index,
         | 
| 457 | 
            +
                                            id=self.current_tool_id,
         | 
| 458 | 
            +
                                            function=DeltaFunctionCall(
         | 
| 459 | 
            +
                                                name=self.current_function_name, arguments=""
         | 
| 460 | 
            +
                                            ),
         | 
| 461 | 
            +
                                            type="function",
         | 
| 462 | 
            +
                                        )
         | 
| 463 | 
            +
                                    ]
         | 
| 464 | 
            +
                                )
         | 
| 465 | 
            +
                        return None
         | 
| 466 | 
            +
             | 
| 467 | 
            +
                    # We've sent header, now handle function body
         | 
| 468 | 
            +
                    if self.in_function:
         | 
| 469 | 
            +
                        # Send opening brace if not sent yet
         | 
| 470 | 
            +
                        if not self.json_started and not self.parameter_prefix in delta_text:
         | 
| 471 | 
            +
                            self.json_started = True
         | 
| 472 | 
            +
                            return DeltaMessage(
         | 
| 473 | 
            +
                                tool_calls=[
         | 
| 474 | 
            +
                                    DeltaToolCall(
         | 
| 475 | 
            +
                                        index=self.current_tool_index,
         | 
| 476 | 
            +
                                        function=DeltaFunctionCall(arguments="{"),
         | 
| 477 | 
            +
                                    )
         | 
| 478 | 
            +
                                ]
         | 
| 479 | 
            +
                            )
         | 
| 480 | 
            +
             | 
| 481 | 
            +
                        # Make sure json_started is set if we're processing parameters
         | 
| 482 | 
            +
                        if not self.json_started:
         | 
| 483 | 
            +
                            self.json_started = True
         | 
| 484 | 
            +
             | 
| 485 | 
            +
                        # Check for function end in accumulated text
         | 
| 486 | 
            +
                        if not self.json_closed and self.function_end_token in tool_text:
         | 
| 487 | 
            +
                            # Close JSON
         | 
| 488 | 
            +
                            self.json_closed = True
         | 
| 489 | 
            +
             | 
| 490 | 
            +
                            # Extract the complete tool call to update prev_tool_call_arr with final arguments
         | 
| 491 | 
            +
                            # Find the function content
         | 
| 492 | 
            +
                            func_start = tool_text.find(self.tool_call_prefix) + len(
         | 
| 493 | 
            +
                                self.tool_call_prefix
         | 
| 494 | 
            +
                            )
         | 
| 495 | 
            +
                            func_content_end = tool_text.find(self.function_end_token, func_start)
         | 
| 496 | 
            +
                            if func_content_end != -1:
         | 
| 497 | 
            +
                                func_content = tool_text[func_start:func_content_end]
         | 
| 498 | 
            +
                                # Parse to get the complete arguments
         | 
| 499 | 
            +
                                try:
         | 
| 500 | 
            +
                                    parsed_tool = self._parse_xml_function_call(
         | 
| 501 | 
            +
                                        func_content, request.tools if request else None
         | 
| 502 | 
            +
                                    )
         | 
| 503 | 
            +
                                    if parsed_tool:
         | 
| 504 | 
            +
                                        # Update existing entry in prev_tool_call_arr with complete arguments
         | 
| 505 | 
            +
                                        for i, tool in enumerate(self.prev_tool_call_arr):
         | 
| 506 | 
            +
                                            if tool.get("name") == parsed_tool.function.name:
         | 
| 507 | 
            +
                                                self.prev_tool_call_arr[i]["arguments"] = (
         | 
| 508 | 
            +
                                                    parsed_tool.function.arguments
         | 
| 509 | 
            +
                                                )
         | 
| 510 | 
            +
                                                break
         | 
| 511 | 
            +
                                except Exception:
         | 
| 512 | 
            +
                                    pass  # Ignore parsing errors during streaming
         | 
| 513 | 
            +
             | 
| 514 | 
            +
                            result = DeltaMessage(
         | 
| 515 | 
            +
                                tool_calls=[
         | 
| 516 | 
            +
                                    DeltaToolCall(
         | 
| 517 | 
            +
                                        index=self.current_tool_index,
         | 
| 518 | 
            +
                                        function=DeltaFunctionCall(arguments="}"),
         | 
| 519 | 
            +
                                    )
         | 
| 520 | 
            +
                                ]
         | 
| 521 | 
            +
                            )
         | 
| 522 | 
            +
             | 
| 523 | 
            +
                            # Reset state for next tool
         | 
| 524 | 
            +
                            self.in_function = False
         | 
| 525 | 
            +
                            self.json_closed = True
         | 
| 526 | 
            +
             | 
| 527 | 
            +
                            return result
         | 
| 528 | 
            +
             | 
| 529 | 
            +
                        # Look for parameters
         | 
| 530 | 
            +
                        # Count how many complete parameters we have processed
         | 
| 531 | 
            +
                        complete_params = tool_text.count(self.parameter_end_token)
         | 
| 532 | 
            +
             | 
| 533 | 
            +
                        # Check if we should start a new parameter
         | 
| 534 | 
            +
                        if not self.in_param and self.param_count < complete_params:
         | 
| 535 | 
            +
                            # Find the unprocessed parameter
         | 
| 536 | 
            +
                            # Count parameter starts
         | 
| 537 | 
            +
                            param_starts = []
         | 
| 538 | 
            +
                            idx = 0
         | 
| 539 | 
            +
                            while True:
         | 
| 540 | 
            +
                                idx = tool_text.find(self.parameter_prefix, idx)
         | 
| 541 | 
            +
                                if idx == -1:
         | 
| 542 | 
            +
                                    break
         | 
| 543 | 
            +
                                param_starts.append(idx)
         | 
| 544 | 
            +
                                idx += len(self.parameter_prefix)
         | 
| 545 | 
            +
             | 
| 546 | 
            +
                            if len(param_starts) > self.param_count:
         | 
| 547 | 
            +
                                # Process the next parameter
         | 
| 548 | 
            +
                                param_idx = param_starts[self.param_count]
         | 
| 549 | 
            +
                                param_start = param_idx + len(self.parameter_prefix)
         | 
| 550 | 
            +
                                remaining = tool_text[param_start:]
         | 
| 551 | 
            +
             | 
| 552 | 
            +
                                if ">" in remaining:
         | 
| 553 | 
            +
                                    # We have the complete parameter name
         | 
| 554 | 
            +
                                    name_end = remaining.find(">")
         | 
| 555 | 
            +
                                    self.current_param_name = remaining[:name_end]
         | 
| 556 | 
            +
             | 
| 557 | 
            +
                                    # Find the parameter value
         | 
| 558 | 
            +
                                    value_start = param_start + name_end + 1
         | 
| 559 | 
            +
                                    value_text = tool_text[value_start:]
         | 
| 560 | 
            +
                                    if value_text.startswith("\n"):
         | 
| 561 | 
            +
                                        value_text = value_text[1:]
         | 
| 562 | 
            +
             | 
| 563 | 
            +
                                    # Find where this parameter ends
         | 
| 564 | 
            +
                                    param_end_idx = value_text.find(self.parameter_end_token)
         | 
| 565 | 
            +
                                    if param_end_idx != -1:
         | 
| 566 | 
            +
                                        # Complete parameter found
         | 
| 567 | 
            +
                                        param_value = value_text[:param_end_idx]
         | 
| 568 | 
            +
                                        if param_value.endswith("\n"):
         | 
| 569 | 
            +
                                            param_value = param_value[:-1]
         | 
| 570 | 
            +
             | 
| 571 | 
            +
                                        # Build complete JSON fragment for this parameter
         | 
| 572 | 
            +
                                        if self.param_count == 0:
         | 
| 573 | 
            +
                                            json_fragment = (
         | 
| 574 | 
            +
                                                '"'
         | 
| 575 | 
            +
                                                + self.current_param_name
         | 
| 576 | 
            +
                                                + '": "'
         | 
| 577 | 
            +
                                                + json.dumps(param_value)[1:-1]
         | 
| 578 | 
            +
                                                + '"'
         | 
| 579 | 
            +
                                            )
         | 
| 580 | 
            +
                                        else:
         | 
| 581 | 
            +
                                            json_fragment = (
         | 
| 582 | 
            +
                                                ', "'
         | 
| 583 | 
            +
                                                + self.current_param_name
         | 
| 584 | 
            +
                                                + '": "'
         | 
| 585 | 
            +
                                                + json.dumps(param_value)[1:-1]
         | 
| 586 | 
            +
                                                + '"'
         | 
| 587 | 
            +
                                            )
         | 
| 588 | 
            +
             | 
| 589 | 
            +
                                        self.param_count += 1
         | 
| 590 | 
            +
             | 
| 591 | 
            +
                                        return DeltaMessage(
         | 
| 592 | 
            +
                                            tool_calls=[
         | 
| 593 | 
            +
                                                DeltaToolCall(
         | 
| 594 | 
            +
                                                    index=self.current_tool_index,
         | 
| 595 | 
            +
                                                    function=DeltaFunctionCall(
         | 
| 596 | 
            +
                                                        arguments=json_fragment
         | 
| 597 | 
            +
                                                    ),
         | 
| 598 | 
            +
                                                )
         | 
| 599 | 
            +
                                            ]
         | 
| 600 | 
            +
                                        )
         | 
| 601 | 
            +
             | 
| 602 | 
            +
                        # Continue parameter value
         | 
| 603 | 
            +
                        if self.in_param:
         | 
| 604 | 
            +
                            if self.parameter_end_token in delta_text:
         | 
| 605 | 
            +
                                # End of parameter
         | 
| 606 | 
            +
                                end_idx = delta_text.find(self.parameter_end_token)
         | 
| 607 | 
            +
                                value_chunk = delta_text[:end_idx]
         | 
| 608 | 
            +
             | 
| 609 | 
            +
                                # Skip past > if at start
         | 
| 610 | 
            +
                                if not self.current_param_value and ">" in value_chunk:
         | 
| 611 | 
            +
                                    gt_idx = value_chunk.find(">")
         | 
| 612 | 
            +
                                    value_chunk = value_chunk[gt_idx + 1 :]
         | 
| 613 | 
            +
             | 
| 614 | 
            +
                                if not self.current_param_value and value_chunk.startswith("\n"):
         | 
| 615 | 
            +
                                    value_chunk = value_chunk[1:]
         | 
| 616 | 
            +
             | 
| 617 | 
            +
                                # Calculate incremental JSON
         | 
| 618 | 
            +
                                full_value = self.current_param_value + value_chunk
         | 
| 619 | 
            +
                                prev_escaped = (
         | 
| 620 | 
            +
                                    json.dumps(self.current_param_value)[1:-1]
         | 
| 621 | 
            +
                                    if self.current_param_value
         | 
| 622 | 
            +
                                    else ""
         | 
| 623 | 
            +
                                )
         | 
| 624 | 
            +
                                full_escaped = json.dumps(full_value)[1:-1]
         | 
| 625 | 
            +
                                delta_escaped = full_escaped[len(prev_escaped) :]
         | 
| 626 | 
            +
             | 
| 627 | 
            +
                                self.in_param = False
         | 
| 628 | 
            +
                                self.current_param_value = ""
         | 
| 629 | 
            +
             | 
| 630 | 
            +
                                return DeltaMessage(
         | 
| 631 | 
            +
                                    tool_calls=[
         | 
| 632 | 
            +
                                        DeltaToolCall(
         | 
| 633 | 
            +
                                            index=self.current_tool_index,
         | 
| 634 | 
            +
                                            function=DeltaFunctionCall(
         | 
| 635 | 
            +
                                                arguments=delta_escaped + '"'
         | 
| 636 | 
            +
                                            ),
         | 
| 637 | 
            +
                                        )
         | 
| 638 | 
            +
                                    ]
         | 
| 639 | 
            +
                                )
         | 
| 640 | 
            +
                            else:
         | 
| 641 | 
            +
                                # Continue accumulating value
         | 
| 642 | 
            +
                                value_chunk = delta_text
         | 
| 643 | 
            +
             | 
| 644 | 
            +
                                # Handle first chunk after param name
         | 
| 645 | 
            +
                                if not self.current_param_value and ">" in value_chunk:
         | 
| 646 | 
            +
                                    gt_idx = value_chunk.find(">")
         | 
| 647 | 
            +
                                    value_chunk = value_chunk[gt_idx + 1 :]
         | 
| 648 | 
            +
             | 
| 649 | 
            +
                                if not self.current_param_value and value_chunk.startswith("\n"):
         | 
| 650 | 
            +
                                    value_chunk = value_chunk[1:]
         | 
| 651 | 
            +
             | 
| 652 | 
            +
                                if value_chunk:
         | 
| 653 | 
            +
                                    # Stream the escaped delta
         | 
| 654 | 
            +
                                    prev_escaped = (
         | 
| 655 | 
            +
                                        json.dumps(self.current_param_value)[1:-1]
         | 
| 656 | 
            +
                                        if self.current_param_value
         | 
| 657 | 
            +
                                        else ""
         | 
| 658 | 
            +
                                    )
         | 
| 659 | 
            +
                                    self.current_param_value += value_chunk
         | 
| 660 | 
            +
                                    full_escaped = json.dumps(self.current_param_value)[1:-1]
         | 
| 661 | 
            +
                                    delta_escaped = full_escaped[len(prev_escaped) :]
         | 
| 662 | 
            +
             | 
| 663 | 
            +
                                    if delta_escaped:
         | 
| 664 | 
            +
                                        return DeltaMessage(
         | 
| 665 | 
            +
                                            tool_calls=[
         | 
| 666 | 
            +
                                                DeltaToolCall(
         | 
| 667 | 
            +
                                                    index=self.current_tool_index,
         | 
| 668 | 
            +
                                                    function=DeltaFunctionCall(
         | 
| 669 | 
            +
                                                        arguments=delta_escaped
         | 
| 670 | 
            +
                                                    ),
         | 
| 671 | 
            +
                                                )
         | 
| 672 | 
            +
                                            ]
         | 
| 673 | 
            +
                                        )
         | 
| 674 | 
            +
             | 
| 675 | 
            +
                    return None
         | 

