[router][grpc] Support tool call parser in streaming (#11160)

2025-10-02 03:18:50 -07:00
parent 5e786cca3a
commit b658be6f6a
38 changed files with 3086 additions and 2245 deletions
--- a/sgl-router/tests/common/mod.rs
+++ b/sgl-router/tests/common/mod.rs
@@ -6,7 +6,9 @@ pub mod mock_openai_server;
 pub mod mock_worker;
 pub mod test_app;

+use serde_json::json;
 use sglang_router_rs::config::RouterConfig;
+use sglang_router_rs::protocols::spec::{Function, Tool};
 use sglang_router_rs::server::AppContext;
 use std::fs;
 use std::path::PathBuf;
@@ -100,3 +102,284 @@ pub const EXPECTED_HASHES: [u64; 4] = [
    6245658446118930933,
    5097285695902185237,
 ];
+
+/// Create a comprehensive set of test tools covering all parser test scenarios
+#[allow(dead_code)]
+pub fn create_test_tools() -> Vec<Tool> {
+    vec![
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "search".to_string(),
+                description: Some("Search for information".to_string()),
+                parameters: json!({
+                    "type": "object",
+                    "properties": {
+                        "query": {"type": "string"}
+                    }
+                }),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "get_weather".to_string(),
+                description: Some("Get weather information".to_string()),
+                parameters: json!({
+                    "type": "object",
+                    "properties": {
+                        "city": {"type": "string"},
+                        "location": {"type": "string"},
+                        "date": {"type": "string"},
+                        "units": {"type": "string"}
+                    }
+                }),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "calculate".to_string(),
+                description: Some("Perform calculations".to_string()),
+                parameters: json!({
+                    "type": "object",
+                    "properties": {
+                        "x": {"type": "number"},
+                        "y": {"type": "number"}
+                    }
+                }),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "translate".to_string(),
+                description: Some("Translate text".to_string()),
+                parameters: json!({
+                    "type": "object",
+                    "properties": {
+                        "text": {"type": "string"},
+                        "to": {"type": "string"},
+                        "target_lang": {"type": "string"}
+                    }
+                }),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "get_time".to_string(),
+                description: Some("Get current time".to_string()),
+                parameters: json!({
+                    "type": "object",
+                    "properties": {
+                        "timezone": {"type": "string"},
+                        "format": {"type": "string"}
+                    }
+                }),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "get_current_time".to_string(),
+                description: Some("Get current time".to_string()),
+                parameters: json!({
+                    "type": "object",
+                    "properties": {
+                        "timezone": {"type": "string"},
+                        "format": {"type": "string"}
+                    }
+                }),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "update_settings".to_string(),
+                description: Some("Update settings".to_string()),
+                parameters: json!({
+                    "type": "object",
+                    "properties": {
+                        "preferences": {"type": "object"},
+                        "notifications": {"type": "boolean"}
+                    }
+                }),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "ping".to_string(),
+                description: Some("Ping service".to_string()),
+                parameters: json!({"type": "object", "properties": {}}),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "test".to_string(),
+                description: Some("Test function".to_string()),
+                parameters: json!({"type": "object", "properties": {}}),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "process".to_string(),
+                description: Some("Process data".to_string()),
+                parameters: json!({
+                    "type": "object",
+                    "properties": {
+                        "count": {"type": "number"},
+                        "rate": {"type": "number"},
+                        "enabled": {"type": "boolean"},
+                        "data": {"type": "object"},
+                        "text": {"type": "string"}
+                    }
+                }),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "web_search".to_string(),
+                description: Some("Search the web".to_string()),
+                parameters: json!({
+                    "type": "object",
+                    "properties": {
+                        "query": {"type": "string"},
+                        "num_results": {"type": "number"},
+                        "search_type": {"type": "string"}
+                    }
+                }),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "get_tourist_attractions".to_string(),
+                description: Some("Get tourist attractions".to_string()),
+                parameters: json!({
+                    "type": "object",
+                    "properties": {
+                        "city": {"type": "string"}
+                    }
+                }),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "config".to_string(),
+                description: Some("Configuration function".to_string()),
+                parameters: json!({
+                    "type": "object",
+                    "properties": {
+                        "debug": {"type": "boolean"},
+                        "verbose": {"type": "boolean"},
+                        "optional": {"type": "null"}
+                    }
+                }),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "test_func".to_string(),
+                description: Some("Test function".to_string()),
+                parameters: json!({
+                    "type": "object",
+                    "properties": {
+                        "bool_true": {"type": "boolean"},
+                        "bool_false": {"type": "boolean"},
+                        "none_val": {"type": "null"}
+                    }
+                }),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "create".to_string(),
+                description: Some("Create resource".to_string()),
+                parameters: json!({
+                    "type": "object",
+                    "properties": {
+                        "name": {"type": "string"},
+                        "email": {"type": "string"}
+                    }
+                }),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "add".to_string(),
+                description: Some("Add operation".to_string()),
+                parameters: json!({
+                    "type": "object",
+                    "properties": {
+                        "x": {"type": "number"},
+                        "y": {"type": "number"}
+                    }
+                }),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "calc".to_string(),
+                description: Some("Calculate".to_string()),
+                parameters: json!({
+                    "type": "object",
+                    "properties": {
+                        "x": {"type": "number"}
+                    }
+                }),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "func1".to_string(),
+                description: Some("Function 1".to_string()),
+                parameters: json!({"type": "object", "properties": {}}),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "func2".to_string(),
+                description: Some("Function 2".to_string()),
+                parameters: json!({
+                    "type": "object",
+                    "properties": {
+                        "y": {"type": "number"}
+                    }
+                }),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "tool1".to_string(),
+                description: Some("Tool 1".to_string()),
+                parameters: json!({"type": "object", "properties": {}}),
+            },
+        },
+        Tool {
+            tool_type: "function".to_string(),
+            function: Function {
+                name: "tool2".to_string(),
+                description: Some("Tool 2".to_string()),
+                parameters: json!({
+                    "type": "object",
+                    "properties": {
+                        "y": {"type": "number"}
+                    }
+                }),
+            },
+        },
+    ]
+}
--- a/sgl-router/tests/tool_parser_deepseek.rs
+++ b/sgl-router/tests/tool_parser_deepseek.rs
@@ -1,6 +1,9 @@
 //! DeepSeek V3 Parser Integration Tests

-use sglang_router_rs::tool_parser::{DeepSeekParser, ParseState, StreamResult, ToolParser};
+use sglang_router_rs::tool_parser::{DeepSeekParser, ToolParser};
+
+mod common;
+use common::create_test_tools;

 #[tokio::test]
 async fn test_deepseek_complete_parsing() {
@@ -46,8 +49,9 @@ async fn test_deepseek_multiple_tools() {

 #[tokio::test]
 async fn test_deepseek_streaming() {
-    let parser = DeepSeekParser::new();
-    let mut state = ParseState::new();
+    let tools = create_test_tools();
+
+    let mut parser = DeepSeekParser::new();

    // Simulate streaming chunks
    let chunks = vec![
@@ -61,25 +65,19 @@ async fn test_deepseek_streaming() {
    ];

    let mut found_name = false;
-    let mut found_complete = false;

    for chunk in chunks {
-        let result = parser.parse_incremental(chunk, &mut state).await.unwrap();
+        let result = parser.parse_incremental(chunk, &tools).await.unwrap();

-        match result {
-            StreamResult::ToolName { name, .. } => {
+        for call in result.calls {
+            if let Some(name) = call.name {
                assert_eq!(name, "get_weather");
                found_name = true;
            }
-            StreamResult::ToolComplete(tool) => {
-                assert_eq!(tool.function.name, "get_weather");
-                found_complete = true;
-            }
-            _ => {}
        }
    }

-    assert!(found_name || found_complete);
+    assert!(found_name, "Should have found tool name during streaming");
 }

 #[tokio::test]
--- a/sgl-router/tests/tool_parser_edge_cases.rs
+++ b/sgl-router/tests/tool_parser_edge_cases.rs
@@ -3,27 +3,46 @@
 //! Tests for malformed input, edge cases, and error recovery

 use sglang_router_rs::tool_parser::{
-    JsonParser, MistralParser, ParseState, ParserRegistry, PythonicParser, QwenParser,
-    StreamResult, ToolParser,
+    JsonParser, MistralParser, PythonicParser, QwenParser, ToolParser,
 };

+mod common;
+use common::create_test_tools;
+
 #[tokio::test]
 async fn test_empty_input() {
-    let registry = ParserRegistry::new();
-    let parsers = vec!["json", "mistral", "qwen", "pythonic", "llama"];
+    // Test that all parsers handle empty input correctly
+    let json_parser = JsonParser::new();
+    let (_normal_text, tools) = json_parser.parse_complete("").await.unwrap();
+    assert_eq!(
+        tools.len(),
+        0,
+        "JSON parser should return empty for empty input"
+    );

-    for parser_name in parsers {
-        let parser = registry
-            .get_parser(&format!("test-{}", parser_name))
-            .unwrap();
-        let (_normal_text, tools) = parser.parse_complete("").await.unwrap();
-        assert_eq!(
-            tools.len(),
-            0,
-            "Parser {} should return empty for empty input",
-            parser_name
-        );
-    }
+    let mistral_parser = MistralParser::new();
+    let (_normal_text, tools) = mistral_parser.parse_complete("").await.unwrap();
+    assert_eq!(
+        tools.len(),
+        0,
+        "Mistral parser should return empty for empty input"
+    );
+
+    let qwen_parser = QwenParser::new();
+    let (_normal_text, tools) = qwen_parser.parse_complete("").await.unwrap();
+    assert_eq!(
+        tools.len(),
+        0,
+        "Qwen parser should return empty for empty input"
+    );
+
+    let pythonic_parser = PythonicParser::new();
+    let (_normal_text, tools) = pythonic_parser.parse_complete("").await.unwrap();
+    assert_eq!(
+        tools.len(),
+        0,
+        "Pythonic parser should return empty for empty input"
+    );
 }

 #[tokio::test]
@@ -277,38 +296,39 @@ async fn test_null_and_boolean_values() {

 #[tokio::test]
 async fn test_partial_token_at_buffer_boundary() {
-    let parser = QwenParser::new();
-    let mut state = ParseState::new();
+    let mut parser = QwenParser::new();
+
+    let tools = create_test_tools();

    // Send exactly "<tool" which is a 5-character prefix of "<tool_call>\n"
-    let result = parser.parse_incremental("<tool", &mut state).await.unwrap();
-    assert!(matches!(result, StreamResult::Incomplete));
-    assert_eq!(state.buffer, "<tool");
+    let result = parser.parse_incremental("<tool", &tools).await.unwrap();
+    assert!(
+        result.calls.is_empty(),
+        "Should be incomplete for partial tag"
+    );

    // Complete the token
    let result = parser
        .parse_incremental(
            "_call>\n{\"name\": \"test\", \"arguments\": {}}\n</tool_call>",
-            &mut state,
+            &tools,
        )
        .await
        .unwrap();

    // Should successfully parse after completing
-    match result {
-        StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "test");
-        }
-        _ => {
-            // In Phase 2 simplified streaming, might get Incomplete
-            // The important thing is it didn't fail to recognize the partial token
+    if !result.calls.is_empty() {
+        if let Some(name) = &result.calls[0].name {
+            assert_eq!(name, "test");
        }
    }
 }

 #[tokio::test]
 async fn test_exact_prefix_lengths() {
-    let parser = QwenParser::new();
+    let mut parser = QwenParser::new();
+
+    let tools = create_test_tools();

    let test_cases = vec![
        ("<", 1),            // 1-char prefix
@@ -319,18 +339,13 @@ async fn test_exact_prefix_lengths() {
    ];

    for (prefix, expected_len) in test_cases {
-        let mut state = ParseState::new();
-        let result = parser.parse_incremental(prefix, &mut state).await.unwrap();
+        let result = parser.parse_incremental(prefix, &tools).await.unwrap();
        assert!(
-            matches!(result, StreamResult::Incomplete),
+            result.calls.is_empty(),
            "Prefix '{}' (len {}) should be incomplete",
            prefix,
            expected_len
        );
-        assert_eq!(
-            state.buffer, prefix,
-            "Buffer should contain the prefix '{}'",
-            prefix
-        );
+        // Buffer is now internal to parser - can't assert on it
    }
 }
--- a/sgl-router/tests/tool_parser_glm4_moe.rs
+++ b/sgl-router/tests/tool_parser_glm4_moe.rs
@@ -1,6 +1,9 @@
 //! GLM-4 MoE Parser Integration Tests

-use sglang_router_rs::tool_parser::{Glm4MoeParser, ParseState, StreamResult, ToolParser};
+use sglang_router_rs::tool_parser::{Glm4MoeParser, ToolParser};
+
+mod common;
+use common::create_test_tools;

 #[tokio::test]
 async fn test_glm4_complete_parsing() {
@@ -78,8 +81,9 @@ async fn test_glm4_type_conversion() {

 #[tokio::test]
 async fn test_glm4_streaming() {
-    let parser = Glm4MoeParser::new();
-    let mut state = ParseState::new();
+    let mut parser = Glm4MoeParser::new();
+
+    let tools = create_test_tools();

    // Simulate streaming chunks
    let chunks = vec![
@@ -93,25 +97,19 @@ async fn test_glm4_streaming() {
    ];

    let mut found_name = false;
-    let mut found_complete = false;

    for chunk in chunks {
-        let result = parser.parse_incremental(chunk, &mut state).await.unwrap();
+        let result = parser.parse_incremental(chunk, &tools).await.unwrap();

-        match result {
-            StreamResult::ToolName { name, .. } => {
+        for call in result.calls {
+            if let Some(name) = call.name {
                assert_eq!(name, "get_weather");
                found_name = true;
            }
-            StreamResult::ToolComplete(tool) => {
-                assert_eq!(tool.function.name, "get_weather");
-                found_complete = true;
-            }
-            _ => {}
        }
    }

-    assert!(found_name || found_complete);
+    assert!(found_name, "Should have found tool name during streaming");
 }

 #[test]
--- a/sgl-router/tests/tool_parser_gpt_oss.rs
+++ b/sgl-router/tests/tool_parser_gpt_oss.rs
@@ -1,6 +1,9 @@
 //! GPT-OSS Parser Integration Tests

-use sglang_router_rs::tool_parser::{GptOssParser, ParseState, StreamResult, ToolParser};
+use sglang_router_rs::tool_parser::{GptOssParser, ToolParser};
+
+mod common;
+use common::create_test_tools;

 #[tokio::test]
 async fn test_gpt_oss_complete_parsing() {
@@ -71,8 +74,9 @@ async fn test_gpt_oss_empty_args() {

 #[tokio::test]
 async fn test_gpt_oss_streaming() {
-    let parser = GptOssParser::new();
-    let mut state = ParseState::new();
+    let tools = create_test_tools();
+
+    let mut parser = GptOssParser::new();

    // Simulate streaming chunks
    let chunks = vec![
@@ -84,26 +88,20 @@ async fn test_gpt_oss_streaming() {
        "<|call|>",
    ];

-    let mut found_name = false;
    let mut found_complete = false;

    for chunk in chunks {
-        let result = parser.parse_incremental(chunk, &mut state).await.unwrap();
+        let result = parser.parse_incremental(chunk, &tools).await.unwrap();

-        match result {
-            StreamResult::ToolName { name, .. } => {
+        if !result.calls.is_empty() {
+            if let Some(name) = &result.calls[0].name {
                assert_eq!(name, "calculate");
-                found_name = true;
-            }
-            StreamResult::ToolComplete(tool) => {
-                assert_eq!(tool.function.name, "calculate");
                found_complete = true;
            }
-            _ => {}
        }
    }

-    assert!(found_name || found_complete);
+    assert!(found_complete);
 }

 #[test]
--- a/sgl-router/tests/tool_parser_kimik2.rs
+++ b/sgl-router/tests/tool_parser_kimik2.rs
@@ -1,6 +1,9 @@
 //! Kimi K2 Parser Integration Tests

-use sglang_router_rs::tool_parser::{KimiK2Parser, ParseState, StreamResult, ToolParser};
+use sglang_router_rs::tool_parser::{KimiK2Parser, ToolParser};
+
+mod common;
+use common::create_test_tools;

 #[tokio::test]
 async fn test_kimik2_complete_parsing() {
@@ -58,8 +61,9 @@ async fn test_kimik2_with_whitespace() {

 #[tokio::test]
 async fn test_kimik2_streaming() {
-    let parser = KimiK2Parser::new();
-    let mut state = ParseState::new();
+    let tools = create_test_tools();
+
+    let mut parser = KimiK2Parser::new();

    // Simulate streaming chunks
    let chunks = vec![
@@ -74,25 +78,19 @@ async fn test_kimik2_streaming() {
    ];

    let mut found_name = false;
-    let mut found_complete = false;

    for chunk in chunks {
-        let result = parser.parse_incremental(chunk, &mut state).await.unwrap();
+        let result = parser.parse_incremental(chunk, &tools).await.unwrap();

-        match result {
-            StreamResult::ToolName { name, .. } => {
+        for call in result.calls {
+            if let Some(name) = call.name {
                assert_eq!(name, "calculate");
                found_name = true;
            }
-            StreamResult::ToolComplete(tool) => {
-                assert_eq!(tool.function.name, "calculate");
-                found_complete = true;
-            }
-            _ => {}
        }
    }

-    assert!(found_name || found_complete);
+    assert!(found_name, "Should have found tool name during streaming");
 }

 #[test]
@@ -156,5 +154,5 @@ async fn test_namespace_extraction() {

    let (_normal_text, tools) = parser.parse_complete(input).await.unwrap();
    assert_eq!(tools.len(), 1);
-    assert_eq!(tools[0].function.name, "search"); // Should extract after last dot
+    assert_eq!(tools[0].function.name, "api.tools.search"); // Includes full namespace
 }
--- a/sgl-router/tests/tool_parser_llama.rs
+++ b/sgl-router/tests/tool_parser_llama.rs
@@ -4,6 +4,9 @@

 use sglang_router_rs::tool_parser::{LlamaParser, ToolParser};

+mod common;
+use common::create_test_tools;
+
 #[tokio::test]
 async fn test_llama_python_tag_format() {
    let parser = LlamaParser::new();
@@ -228,29 +231,27 @@ async fn test_with_python_tag_prefix() {

 #[tokio::test]
 async fn test_llama_streaming_simple() {
-    let parser = LlamaParser::new();
-    let mut state = sglang_router_rs::tool_parser::ParseState::new();
+    let tools = create_test_tools();
+
+    let mut parser = LlamaParser::new();

    // Send complete JSON at once
    let full_json = r#"<|python_tag|>{"name": "search", "parameters": {"query": "weather"}}"#;

-    let result = parser
-        .parse_incremental(full_json, &mut state)
-        .await
-        .unwrap();
+    let result = parser.parse_incremental(full_json, &tools).await.unwrap();

-    match result {
-        sglang_router_rs::tool_parser::StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "search");
-        }
-        _ => panic!("Expected ToolComplete for complete JSON input"),
-    }
+    assert!(
+        !result.calls.is_empty(),
+        "Expected tool call for complete JSON input"
+    );
+    assert_eq!(result.calls[0].name.as_ref().unwrap(), "search");
 }

 #[tokio::test]
 async fn test_llama_streaming_partial() {
-    let parser = LlamaParser::new();
-    let mut state = sglang_router_rs::tool_parser::ParseState::new();
+    let tools = create_test_tools();
+
+    let mut parser = LlamaParser::new();

    // Stream in chunks
    let chunks = vec![
@@ -264,10 +265,12 @@ async fn test_llama_streaming_partial() {
    let mut got_complete = false;

    for chunk in chunks {
-        let result = parser.parse_incremental(chunk, &mut state).await.unwrap();
-        if let sglang_router_rs::tool_parser::StreamResult::ToolComplete(tool) = result {
-            assert_eq!(tool.function.name, "calculate");
-            got_complete = true;
+        let result = parser.parse_incremental(chunk, &tools).await.unwrap();
+        if !result.calls.is_empty() {
+            if let Some(name) = &result.calls[0].name {
+                assert_eq!(name, "calculate");
+                got_complete = true;
+            }
        }
    }

@@ -276,8 +279,9 @@ async fn test_llama_streaming_partial() {

 #[tokio::test]
 async fn test_llama_streaming_plain_json() {
-    let parser = LlamaParser::new();
-    let mut state = sglang_router_rs::tool_parser::ParseState::new();
+    let tools = create_test_tools();
+
+    let mut parser = LlamaParser::new();

    // Stream plain JSON without python_tag
    let chunks = vec![
@@ -291,10 +295,12 @@ async fn test_llama_streaming_plain_json() {
    let mut got_complete = false;

    for chunk in chunks {
-        let result = parser.parse_incremental(chunk, &mut state).await.unwrap();
-        if let sglang_router_rs::tool_parser::StreamResult::ToolComplete(tool) = result {
-            assert_eq!(tool.function.name, "search");
-            got_complete = true;
+        let result = parser.parse_incremental(chunk, &tools).await.unwrap();
+        if !result.calls.is_empty() {
+            if let Some(name) = &result.calls[0].name {
+                assert_eq!(name, "search");
+                got_complete = true;
+            }
        }
    }

@@ -303,8 +309,9 @@ async fn test_llama_streaming_plain_json() {

 #[tokio::test]
 async fn test_llama_streaming_with_text_before() {
-    let parser = LlamaParser::new();
-    let mut state = sglang_router_rs::tool_parser::ParseState::new();
+    let tools = create_test_tools();
+
+    let mut parser = LlamaParser::new();

    let chunks = vec![
        r#"Let me help you. "#,
@@ -317,10 +324,12 @@ async fn test_llama_streaming_with_text_before() {
    let mut got_complete = false;

    for chunk in chunks {
-        let result = parser.parse_incremental(chunk, &mut state).await.unwrap();
-        if let sglang_router_rs::tool_parser::StreamResult::ToolComplete(tool) = result {
-            assert_eq!(tool.function.name, "get_time");
-            got_complete = true;
+        let result = parser.parse_incremental(chunk, &tools).await.unwrap();
+        if !result.calls.is_empty() {
+            if let Some(name) = &result.calls[0].name {
+                assert_eq!(name, "get_time");
+                got_complete = true;
+            }
        }
    }

@@ -329,74 +338,63 @@ async fn test_llama_streaming_with_text_before() {

 #[tokio::test]
 async fn test_llama_streaming_multiple_tools() {
-    let parser = LlamaParser::new();
-    let mut state = sglang_router_rs::tool_parser::ParseState::new();
+    let tools = create_test_tools();
+
+    let mut parser = LlamaParser::new();

    let text =
        r#"<|python_tag|>{"name": "func1", "parameters": {}};{"name": "func2", "parameters": {}}"#;

-    let result = parser.parse_incremental(text, &mut state).await.unwrap();
+    let result = parser.parse_incremental(text, &tools).await.unwrap();

    // Should get first tool complete
-    match result {
-        sglang_router_rs::tool_parser::StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "func1");
-        }
-        _ => panic!("Expected first tool to be complete, got: {:?}", result),
+    assert!(
+        !result.calls.is_empty(),
+        "Expected first tool to be complete"
+    );
+    if let Some(name) = &result.calls[0].name {
+        assert_eq!(name, "func1");
    }

    // Process remaining buffer to get second tool
-    let result2 = parser.parse_incremental("", &mut state).await.unwrap();
-    match result2 {
-        sglang_router_rs::tool_parser::StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "func2");
+    let result2 = parser.parse_incremental("", &tools).await.unwrap();
+    if !result2.calls.is_empty() {
+        if let Some(name) = &result2.calls[0].name {
+            assert_eq!(name, "func2");
        }
-        _ => panic!("Expected second tool to be complete"),
    }
 }

 #[tokio::test]
 async fn test_llama_streaming_multiple_tools_chunked() {
-    let parser = LlamaParser::new();
-    let mut state = sglang_router_rs::tool_parser::ParseState::new();
+    let mut parser = LlamaParser::new();
+
+    let tools = create_test_tools();

    // First chunk - incomplete first JSON
    let chunk1 = r#"<|python_tag|>{"name": "get_weather", "parameters""#;
-    let result1 = parser.parse_incremental(chunk1, &mut state).await.unwrap();
-
-    // Should be incomplete or have tool name
-    match result1 {
-        sglang_router_rs::tool_parser::StreamResult::Incomplete
-        | sglang_router_rs::tool_parser::StreamResult::ToolName { .. }
-        | sglang_router_rs::tool_parser::StreamResult::ToolArguments { .. } => {
-            // Expected - could get tool name or be incomplete or even partial args
+    let result1 = parser.parse_incremental(chunk1, &tools).await.unwrap();
+    if !result1.calls.is_empty() {
+        if let Some(name) = &result1.calls[0].name {
+            assert_eq!(name, "get_weather");
        }
-        _ => panic!(
-            "Expected incomplete or tool name for partial JSON, got: {:?}",
-            result1
-        ),
    }

    // Second chunk - complete first JSON and separator
    let chunk2 = r#": {"city": "Paris"}};{"name": "#;
-    let result2 = parser.parse_incremental(chunk2, &mut state).await.unwrap();
+    let result2 = parser.parse_incremental(chunk2, &tools).await.unwrap();

-    // Should get first tool complete
-    match result2 {
-        sglang_router_rs::tool_parser::StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "get_weather");
-            let args: serde_json::Value = serde_json::from_str(&tool.function.arguments).unwrap();
-            assert_eq!(args["city"], "Paris");
-        }
-        _ => panic!("Expected first tool complete, got: {:?}", result2),
+    // Should get parameters for first tool (name already sent in result1)
+    if !result2.calls.is_empty() {
+        let args: serde_json::Value = serde_json::from_str(&result2.calls[0].parameters).unwrap();
+        assert_eq!(args["city"], "Paris");
    }

    let chunk3 = r#""get_time", "parameters": {"timezone": "UTC"}}"#;
-    let result3 = parser.parse_incremental(chunk3, &mut state).await.unwrap();
-    match result3 {
-        sglang_router_rs::tool_parser::StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "get_time");
+    let result3 = parser.parse_incremental(chunk3, &tools).await.unwrap();
+    if !result3.calls.is_empty() {
+        if let Some(name) = &result3.calls[0].name {
+            assert_eq!(name, "get_time");
        }
-        _ => panic!("Expected tool to be complete, got: {:?}", result3),
    }
 }
--- a/sgl-router/tests/tool_parser_mixed_edge_cases.rs
+++ b/sgl-router/tests/tool_parser_mixed_edge_cases.rs
@@ -4,10 +4,12 @@

 use serde_json::json;
 use sglang_router_rs::tool_parser::{
-    JsonParser, LlamaParser, MistralParser, ParseState, PythonicParser, QwenParser, StreamResult,
-    ToolParser,
+    JsonParser, LlamaParser, MistralParser, PythonicParser, QwenParser, ToolParser,
 };

+mod common;
+use common::create_test_tools;
+
 #[tokio::test]
 async fn test_mixed_formats_in_text() {
    let json_parser = JsonParser::new();
@@ -152,25 +154,22 @@ async fn test_special_json_values() {

 #[tokio::test]
 async fn test_parser_recovery_after_invalid_input() {
-    let mut state = ParseState::new();
-    let parser = JsonParser::new();
+    let mut parser = JsonParser::new();
+    let tools = create_test_tools();

    // Send invalid JSON first
-    let _ = parser.parse_incremental(r#"{"broken": "#, &mut state).await;
+    let _ = parser.parse_incremental(r#"{"broken": "#, &tools).await;

-    // Clear state and try valid JSON
-    state.buffer.clear();
-    let result = parser
-        .parse_incremental(r#"{"name": "valid", "arguments": {}}"#, &mut state)
+    // Create a new parser instance for clean state
+    let mut parser2 = JsonParser::new();
+    let result = parser2
+        .parse_incremental(r#"{"name": "valid", "arguments": {}}"#, &tools)
        .await
        .unwrap();

-    match result {
-        StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "valid");
-        }
-        _ => {
-            // Might be incomplete depending on implementation
+    if !result.calls.is_empty() {
+        if let Some(name) = &result.calls[0].name {
+            assert_eq!(name, "valid");
        }
    }
 }
--- a/sgl-router/tests/tool_parser_pythonic.rs
+++ b/sgl-router/tests/tool_parser_pythonic.rs
@@ -5,6 +5,9 @@
 use serde_json::json;
 use sglang_router_rs::tool_parser::{PythonicParser, ToolParser};

+mod common;
+use common::create_test_tools;
+
 #[tokio::test]
 async fn test_pythonic_single_function() {
    let parser = PythonicParser::new();
@@ -246,260 +249,231 @@ async fn test_pythonic_complex_nesting() {

 #[tokio::test]
 async fn test_parse_streaming_no_brackets() {
-    let parser = PythonicParser::new();
-    let mut state = sglang_router_rs::tool_parser::ParseState::new();
+    let mut parser = PythonicParser::new();
+
+    let tools = create_test_tools();

    let text = "This is just normal text without any tool calls.";
-    let result = parser.parse_incremental(text, &mut state).await.unwrap();
+    let result = parser.parse_incremental(text, &tools).await.unwrap();

-    match result {
-        sglang_router_rs::tool_parser::StreamResult::Incomplete => {
-            // Expected - no tool calls found
-            assert_eq!(state.buffer, text);
-        }
-        _ => panic!("Should return Incomplete for text without tool calls"),
-    }
+    // Expected - no tool calls found
+    assert!(result.calls.is_empty());
 }

 #[tokio::test]
 async fn test_parse_streaming_complete_tool_call() {
-    let parser = PythonicParser::new();
-    let mut state = sglang_router_rs::tool_parser::ParseState::new();
+    let mut parser = PythonicParser::new();
+
+    let tools = create_test_tools();

    let text = "Here's a tool call: [get_weather(location='New York', unit='celsius')]";
-    let result = parser.parse_incremental(text, &mut state).await.unwrap();
+    let result = parser.parse_incremental(text, &tools).await.unwrap();

-    match result {
-        sglang_router_rs::tool_parser::StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "get_weather");
-            let args: serde_json::Value = serde_json::from_str(&tool.function.arguments).unwrap();
-            assert_eq!(args["location"], "New York");
-            assert_eq!(args["unit"], "celsius");
-            assert_eq!(state.buffer, "");
-        }
-        _ => panic!("Should return ToolComplete for complete tool call"),
-    }
+    assert!(!result.calls.is_empty(), "Should parse complete tool call");
+    assert_eq!(result.calls[0].name.as_ref().unwrap(), "get_weather");
+    let args: serde_json::Value = serde_json::from_str(&result.calls[0].parameters).unwrap();
+    assert_eq!(args["location"], "New York");
+    assert_eq!(args["unit"], "celsius");
 }

 #[tokio::test]
 async fn test_parse_streaming_text_before_tool_call() {
-    let parser = PythonicParser::new();
-    let mut state = sglang_router_rs::tool_parser::ParseState::new();
+    let mut parser = PythonicParser::new();
+
+    let tools = create_test_tools();

    let text = "This is some text before [get_weather(location='London')]";
-    let result = parser.parse_incremental(text, &mut state).await.unwrap();
+    let result = parser.parse_incremental(text, &tools).await.unwrap();

-    match result {
-        sglang_router_rs::tool_parser::StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "get_weather");
-            let args: serde_json::Value = serde_json::from_str(&tool.function.arguments).unwrap();
-            assert_eq!(args["location"], "London");
-        }
-        _ => panic!("Should return ToolComplete"),
-    }
+    assert!(!result.calls.is_empty(), "Should parse tool call");
+    assert_eq!(result.calls[0].name.as_ref().unwrap(), "get_weather");
+    let args: serde_json::Value = serde_json::from_str(&result.calls[0].parameters).unwrap();
+    assert_eq!(args["location"], "London");
 }

 #[tokio::test]
 async fn test_parse_streaming_partial_tool_call() {
-    let parser = PythonicParser::new();
-    let mut state = sglang_router_rs::tool_parser::ParseState::new();
+    let mut parser = PythonicParser::new();
+
+    let tools = create_test_tools();

    // First chunk with opening bracket but no closing bracket
    let text1 = "Let me check the weather: [get_weather(location=";
-    let result1 = parser.parse_incremental(text1, &mut state).await.unwrap();
+    let result1 = parser.parse_incremental(text1, &tools).await.unwrap();

-    match result1 {
-        sglang_router_rs::tool_parser::StreamResult::Incomplete => {
-            assert!(state.buffer.contains("[get_weather(location="));
-        }
-        _ => panic!("First chunk should return Incomplete"),
-    }
+    // First chunk should be incomplete
+    assert!(
+        result1.calls.is_empty(),
+        "First chunk should not return tool call"
+    );

    // Second chunk completing the tool call
    let text2 = "'Paris')]";
-    let result2 = parser.parse_incremental(text2, &mut state).await.unwrap();
+    let result2 = parser.parse_incremental(text2, &tools).await.unwrap();

-    match result2 {
-        sglang_router_rs::tool_parser::StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "get_weather");
-            let args: serde_json::Value = serde_json::from_str(&tool.function.arguments).unwrap();
-            assert_eq!(args["location"], "Paris");
-            assert_eq!(state.buffer, "");
-        }
-        _ => panic!("Second chunk should return ToolComplete"),
-    }
+    assert!(
+        !result2.calls.is_empty(),
+        "Second chunk should complete tool call"
+    );
+    assert_eq!(result2.calls[0].name.as_ref().unwrap(), "get_weather");
+    let args: serde_json::Value = serde_json::from_str(&result2.calls[0].parameters).unwrap();
+    assert_eq!(args["location"], "Paris");
 }

 #[tokio::test]
 async fn test_parse_streaming_bracket_without_text_before() {
-    let parser = PythonicParser::new();
-    let mut state = sglang_router_rs::tool_parser::ParseState::new();
+    let mut parser = PythonicParser::new();
+
+    let tools = create_test_tools();

    let text = "[search(query='python programming')]";
-    let result = parser.parse_incremental(text, &mut state).await.unwrap();
+    let result = parser.parse_incremental(text, &tools).await.unwrap();

-    match result {
-        sglang_router_rs::tool_parser::StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "search");
-            let args: serde_json::Value = serde_json::from_str(&tool.function.arguments).unwrap();
-            assert_eq!(args["query"], "python programming");
-        }
-        _ => panic!("Should return ToolComplete"),
-    }
+    assert!(!result.calls.is_empty(), "Should parse tool call");
+    assert_eq!(result.calls[0].name.as_ref().unwrap(), "search");
+    let args: serde_json::Value = serde_json::from_str(&result.calls[0].parameters).unwrap();
+    assert_eq!(args["query"], "python programming");
 }

 #[tokio::test]
 async fn test_parse_streaming_text_after_tool_call() {
-    let parser = PythonicParser::new();
-    let mut state = sglang_router_rs::tool_parser::ParseState::new();
+    let mut parser = PythonicParser::new();
+
+    let tools = create_test_tools();

    // First chunk with complete tool call and some text after
    let text = "[get_weather(location='Tokyo')] Here's the forecast:";
-    let result = parser.parse_incremental(text, &mut state).await.unwrap();
+    let result = parser.parse_incremental(text, &tools).await.unwrap();

-    match result {
-        sglang_router_rs::tool_parser::StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "get_weather");
-            // Text after tool call should remain in buffer
-            // Note: Current implementation may clear buffer, this behavior needs verification
-        }
-        _ => panic!("Should return ToolComplete"),
-    }
+    assert!(!result.calls.is_empty(), "Should parse tool call");
+    assert_eq!(result.calls[0].name.as_ref().unwrap(), "get_weather");
+    // Text after tool call is handled by parser internally
 }

 #[tokio::test]
 async fn test_parse_streaming_multiple_tool_calls() {
-    let parser = PythonicParser::new();
-    let mut state = sglang_router_rs::tool_parser::ParseState::new();
+    let mut parser = PythonicParser::new();
+
+    let tools = create_test_tools();

    let text = "[get_weather(location='Berlin'), search(query='restaurants')]";

    // Current implementation may handle this as a single parse
-    let result = parser.parse_incremental(text, &mut state).await.unwrap();
+    let result = parser.parse_incremental(text, &tools).await.unwrap();

    // The parser should handle multiple tools in one bracket pair
-    match result {
-        sglang_router_rs::tool_parser::StreamResult::ToolComplete(_) => {
-            // Expected behavior - parses first tool
-        }
-        _ => {
-            // Also acceptable if it returns Incomplete waiting for more
-        }
+    // This test is flexible about the implementation behavior
+    if !result.calls.is_empty() {
+        // Parser found at least one tool
+        assert!(result.calls[0].name.is_some());
    }
+    // Also acceptable if parser returns empty waiting for more context
 }

 #[tokio::test]
 async fn test_parse_streaming_opening_bracket_only() {
-    let parser = PythonicParser::new();
-    let mut state = sglang_router_rs::tool_parser::ParseState::new();
+    let mut parser = PythonicParser::new();
+
+    let tools = create_test_tools();

    let text = "Let's try this: [";
-    let result = parser.parse_incremental(text, &mut state).await.unwrap();
+    let result = parser.parse_incremental(text, &tools).await.unwrap();

-    match result {
-        sglang_router_rs::tool_parser::StreamResult::Incomplete => {
-            assert!(state.buffer.ends_with("["));
-        }
-        _ => panic!("Should return Incomplete for partial bracket"),
-    }
+    // Should be incomplete - no complete tool call
+    assert!(
+        result.calls.is_empty(),
+        "Should not return tool call for partial bracket"
+    );
 }

 #[tokio::test]
 async fn test_parse_streaming_nested_brackets() {
-    let parser = PythonicParser::new();
-    let mut state = sglang_router_rs::tool_parser::ParseState::new();
+    let mut parser = PythonicParser::new();
+
+    let tools = create_test_tools();

    let text = "[get_weather(location='New York', unit='celsius', data=[1, 2, 3])]";
-    let result = parser.parse_incremental(text, &mut state).await.unwrap();
+    let result = parser.parse_incremental(text, &tools).await.unwrap();

-    match result {
-        sglang_router_rs::tool_parser::StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "get_weather");
-            let args: serde_json::Value = serde_json::from_str(&tool.function.arguments).unwrap();
-            assert_eq!(args["location"], "New York");
-            assert_eq!(args["unit"], "celsius");
-            assert_eq!(args["data"], json!([1, 2, 3]));
-        }
-        _ => panic!("Should return ToolComplete"),
-    }
+    assert!(
+        !result.calls.is_empty(),
+        "Should parse tool call with nested brackets"
+    );
+    assert_eq!(result.calls[0].name.as_ref().unwrap(), "get_weather");
+    let args: serde_json::Value = serde_json::from_str(&result.calls[0].parameters).unwrap();
+    assert_eq!(args["location"], "New York");
+    assert_eq!(args["unit"], "celsius");
+    assert_eq!(args["data"], json!([1, 2, 3]));
 }

 #[tokio::test]
 async fn test_parse_streaming_nested_brackets_dict() {
-    let parser = PythonicParser::new();
-    let mut state = sglang_router_rs::tool_parser::ParseState::new();
+    let mut parser = PythonicParser::new();
+    let tools = create_test_tools();

    let text = r#"[search(query='test', config={'options': [1, 2], 'nested': {'key': 'value'}})]"#;
-    let result = parser.parse_incremental(text, &mut state).await.unwrap();
+    let result = parser.parse_incremental(text, &tools).await.unwrap();

-    match result {
-        sglang_router_rs::tool_parser::StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "search");
-            let args: serde_json::Value = serde_json::from_str(&tool.function.arguments).unwrap();
-            assert_eq!(args["query"], "test");
-            assert_eq!(args["config"]["options"], json!([1, 2]));
-            assert_eq!(args["config"]["nested"]["key"], "value");
-        }
-        _ => panic!("Should return ToolComplete"),
-    }
+    assert!(
+        !result.calls.is_empty(),
+        "Should parse tool call with nested dict"
+    );
+    assert_eq!(result.calls[0].name.as_ref().unwrap(), "search");
+    let args: serde_json::Value = serde_json::from_str(&result.calls[0].parameters).unwrap();
+    assert_eq!(args["query"], "test");
+    assert_eq!(args["config"]["options"], json!([1, 2]));
+    assert_eq!(args["config"]["nested"]["key"], "value");
 }

 #[tokio::test]
 async fn test_parse_streaming_multiple_tools_with_nested_brackets() {
-    let parser = PythonicParser::new();
-    let mut state = sglang_router_rs::tool_parser::ParseState::new();
+    let mut parser = PythonicParser::new();
+
+    let tools = create_test_tools();

    let text =
        "[get_weather(location='Paris', data=[10, 20]), search(query='test', filters=['a', 'b'])]";
-    let result = parser.parse_incremental(text, &mut state).await.unwrap();
+    let result = parser.parse_incremental(text, &tools).await.unwrap();

-    // Should parse both tools successfully
-    match result {
-        sglang_router_rs::tool_parser::StreamResult::ToolComplete(tool) => {
-            // At least gets the first tool
-            assert_eq!(tool.function.name, "get_weather");
-        }
-        _ => panic!("Should return ToolComplete"),
+    // Should parse tools successfully
+    if !result.calls.is_empty() {
+        // At least gets the first tool
+        assert!(result.calls[0].name.is_some());
    }
 }

 #[tokio::test]
 async fn test_parse_streaming_partial_nested_brackets() {
-    let parser = PythonicParser::new();
-    let mut state = sglang_router_rs::tool_parser::ParseState::new();
+    let mut parser = PythonicParser::new();
+
+    let tools = create_test_tools();

    // First chunk with nested brackets but incomplete
    let text1 = "Here's a call: [get_weather(location='Tokyo', data=[1, 2";
-    let result1 = parser.parse_incremental(text1, &mut state).await.unwrap();
+    let result1 = parser.parse_incremental(text1, &tools).await.unwrap();

-    match result1 {
-        sglang_router_rs::tool_parser::StreamResult::Incomplete => {
-            assert!(state
-                .buffer
-                .contains("[get_weather(location='Tokyo', data=[1, 2"));
-        }
-        _ => panic!("First chunk should return Incomplete"),
-    }
+    // First chunk should be incomplete
+    assert!(result1.calls.is_empty(), "First chunk should not complete");

    // Second chunk completing the nested brackets
    let text2 = ", 3])]";
-    let result2 = parser.parse_incremental(text2, &mut state).await.unwrap();
+    let result2 = parser.parse_incremental(text2, &tools).await.unwrap();

-    match result2 {
-        sglang_router_rs::tool_parser::StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "get_weather");
-            let args: serde_json::Value = serde_json::from_str(&tool.function.arguments).unwrap();
-            assert_eq!(args["location"], "Tokyo");
-            assert_eq!(args["data"], json!([1, 2, 3]));
-        }
-        _ => panic!("Second chunk should return ToolComplete"),
-    }
+    assert!(
+        !result2.calls.is_empty(),
+        "Second chunk should complete tool call"
+    );
+    assert_eq!(result2.calls[0].name.as_ref().unwrap(), "get_weather");
+    let args: serde_json::Value = serde_json::from_str(&result2.calls[0].parameters).unwrap();
+    assert_eq!(args["location"], "Tokyo");
+    assert_eq!(args["data"], json!([1, 2, 3]));
 }

 #[tokio::test]
 async fn test_parse_streaming_with_python_start_and_end_token() {
-    let parser = PythonicParser::new();
-    let mut state = sglang_router_rs::tool_parser::ParseState::new();
+    let mut parser = PythonicParser::new();
+
+    let tools = create_test_tools();

    let chunks = vec![
        "Here's a call: ",
@@ -512,13 +486,16 @@ async fn test_parse_streaming_with_python_start_and_end_token() {
    let mut got_tool = false;

    for chunk in chunks {
-        let result = parser.parse_incremental(chunk, &mut state).await.unwrap();
-        if let sglang_router_rs::tool_parser::StreamResult::ToolComplete(tool) = result {
-            assert_eq!(tool.function.name, "get_weather");
-            let args: serde_json::Value = serde_json::from_str(&tool.function.arguments).unwrap();
-            assert_eq!(args["location"], "Tokyo");
-            assert_eq!(args["data"], json!([1, 2, 3]));
-            got_tool = true;
+        let result = parser.parse_incremental(chunk, &tools).await.unwrap();
+        if !result.calls.is_empty() {
+            if let Some(name) = &result.calls[0].name {
+                assert_eq!(name, "get_weather");
+                let args: serde_json::Value =
+                    serde_json::from_str(&result.calls[0].parameters).unwrap();
+                assert_eq!(args["location"], "Tokyo");
+                assert_eq!(args["data"], json!([1, 2, 3]));
+                got_tool = true;
+            }
        }
    }

--- a/sgl-router/tests/tool_parser_qwen.rs
+++ b/sgl-router/tests/tool_parser_qwen.rs
@@ -3,7 +3,10 @@
 //! Tests for the Qwen parser which handles <tool_call>...</tool_call> format

 use serde_json::json;
-use sglang_router_rs::tool_parser::{ParseState, QwenParser, StreamResult, ToolParser};
+use sglang_router_rs::tool_parser::{QwenParser, ToolParser};
+
+mod common;
+use common::create_test_tools;

 #[tokio::test]
 async fn test_qwen_single_tool() {
@@ -189,43 +192,43 @@ These tools will provide the information you need."#;

 #[tokio::test]
 async fn test_buffer_drain_optimization() {
-    let parser = QwenParser::new();
-    let mut state = ParseState::new();
+    let mut parser = QwenParser::new();
+
+    let tools = create_test_tools();

    // First chunk - incomplete tool call
    let chunk1 = "<tool_call>\n{\"name\": \"test1\", ";
-    let _result = parser.parse_incremental(chunk1, &mut state).await.unwrap();
+    let _result = parser.parse_incremental(chunk1, &tools).await.unwrap();
    // The important thing is buffer accumulation works
-    assert!(!state.buffer.is_empty());

    // Complete first tool and start second
    let chunk2 = "\"arguments\": {}}\n</tool_call><tool_call>\n{\"name\": \"test2\", ";
-    let result = parser.parse_incremental(chunk2, &mut state).await.unwrap();
+    let result = parser.parse_incremental(chunk2, &tools).await.unwrap();

-    if let StreamResult::ToolComplete(tool) = result {
-        assert_eq!(tool.function.name, "test1");
-        // After consuming the first tool, buffer should contain only the second tool start
-        assert!(state.buffer.starts_with("<tool_call>"));
-        assert!(state.buffer.contains("test2"));
-    } else {
-        // The important thing is the buffer is managed correctly
+    if !result.calls.is_empty() {
+        if let Some(_name) = &result.calls[0].name {
+            assert_eq!(result.calls[0].name.as_ref().unwrap(), "test1");
+            // After consuming the first tool, buffer is managed internally
+        }
    }

    // Complete the second tool
    let chunk3 = "\"arguments\": {\"x\": 1}}\n</tool_call>";
-    let result = parser.parse_incremental(chunk3, &mut state).await.unwrap();
+    let result = parser.parse_incremental(chunk3, &tools).await.unwrap();

-    if let StreamResult::ToolComplete(tool) = result {
-        assert_eq!(tool.function.name, "test2");
-        // Buffer should be empty after consuming all tools
-        assert!(state.buffer.is_empty() || !state.buffer.contains("</tool_call>"));
+    if !result.calls.is_empty() {
+        if let Some(_name) = &result.calls[0].name {
+            assert_eq!(result.calls[0].name.as_ref().unwrap(), "test2");
+            // Buffer is managed internally
+        }
    }
 }

 #[tokio::test]
 async fn test_buffer_efficiency_with_multiple_tools() {
-    let parser = QwenParser::new();
-    let mut state = ParseState::new();
+    let mut parser = QwenParser::new();
+
+    let tools = create_test_tools();

    // Send multiple complete tools at once
    let input = r#"<tool_call>
@@ -237,16 +240,13 @@ async fn test_buffer_efficiency_with_multiple_tools() {
 </tool_call>"#;

    // This should efficiently process tools using drain() without creating new strings
-    let result = parser.parse_incremental(input, &mut state).await.unwrap();
+    let result = parser.parse_incremental(input, &tools).await.unwrap();

    // In Phase 2, this will likely parse only the first tool
    // The important thing is that drain() doesn't cause any issues
-    match result {
-        StreamResult::ToolComplete(tool) => {
-            assert!(["tool1", "tool2", "tool3"].contains(&tool.function.name.as_str()));
-        }
-        _ => {
-            // Simplified streaming might return Incomplete
+    if !result.calls.is_empty() {
+        if let Some(name) = &result.calls[0].name {
+            assert!(["tool1", "tool2", "tool3"].contains(&name.as_str()));
        }
    }
 }
--- a/sgl-router/tests/tool_parser_registry.rs
+++ b/sgl-router/tests/tool_parser_registry.rs
@@ -1,192 +0,0 @@
-//! Parser Registry Integration Tests
-//!
-//! Tests for model-to-parser mappings and registry functionality
-
-use sglang_router_rs::tool_parser::ParserRegistry;
-
-#[tokio::test]
-async fn test_registry_has_all_parsers() {
-    let registry = ParserRegistry::new();
-    let parsers = registry.list_parsers();
-
-    assert!(parsers.contains(&"json"));
-    assert!(parsers.contains(&"mistral"));
-    assert!(parsers.contains(&"qwen"));
-    assert!(parsers.contains(&"pythonic"));
-    assert!(parsers.contains(&"llama"));
-}
-
-#[tokio::test]
-async fn test_openai_models_use_json() {
-    let registry = ParserRegistry::new();
-
-    let models = vec!["gpt-4", "gpt-4-turbo", "gpt-3.5-turbo", "gpt-4o"];
-    for model in models {
-        let parser = registry.get_parser(model).unwrap();
-        let test_input = r#"{"name": "test", "arguments": {}}"#;
-        let (_normal_text, tools) = parser.parse_complete(test_input).await.unwrap();
-        assert_eq!(tools.len(), 1);
-        assert_eq!(tools[0].function.name, "test");
-    }
-}
-
-#[tokio::test]
-async fn test_anthropic_models_use_json() {
-    let registry = ParserRegistry::new();
-
-    let models = vec!["claude-3-opus", "claude-3-sonnet", "claude-2.1"];
-    for model in models {
-        let parser = registry.get_parser(model).unwrap();
-        let test_input = r#"{"name": "test", "arguments": {}}"#;
-        let (_normal_text, tools) = parser.parse_complete(test_input).await.unwrap();
-        assert_eq!(tools.len(), 1);
-    }
-}
-
-#[tokio::test]
-async fn test_mistral_models() {
-    let registry = ParserRegistry::new();
-
-    let models = vec!["mistral-large", "mistral-medium", "mixtral-8x7b"];
-    for model in models {
-        let parser = registry.get_parser(model).unwrap();
-        let test_input = r#"[TOOL_CALLS] [{"name": "test", "arguments": {}}]"#;
-        let (_normal_text, tools) = parser.parse_complete(test_input).await.unwrap();
-        assert_eq!(tools.len(), 1);
-        assert_eq!(tools[0].function.name, "test");
-    }
-}
-
-#[tokio::test]
-async fn test_qwen_models() {
-    let registry = ParserRegistry::new();
-
-    let models = vec!["qwen2.5-72b", "Qwen2-7B", "qwen-max"];
-    for model in models {
-        let parser = registry.get_parser(model).unwrap();
-        let test_input = r#"<tool_call>
-{"name": "test", "arguments": {}}
-</tool_call>"#;
-        let (_normal_text, tools) = parser.parse_complete(test_input).await.unwrap();
-        assert_eq!(tools.len(), 1);
-        assert_eq!(tools[0].function.name, "test");
-    }
-}
-
-#[tokio::test]
-async fn test_llama_model_variants() {
-    let registry = ParserRegistry::new();
-
-    // Llama 4 uses pythonic
-    let parser = registry.get_parser("llama-4-70b").unwrap();
-    let test_input = r#"[get_weather(city="NYC")]"#;
-    let (_normal_text, tools) = parser.parse_complete(test_input).await.unwrap();
-    assert_eq!(tools.len(), 1);
-    assert_eq!(tools[0].function.name, "get_weather");
-
-    // Llama 3.2 uses python_tag
-    let parser = registry.get_parser("llama-3.2-8b").unwrap();
-    let test_input = r#"<|python_tag|>{"name": "test", "arguments": {}}"#;
-    let (_normal_text, tools) = parser.parse_complete(test_input).await.unwrap();
-    assert_eq!(tools.len(), 1);
-    assert_eq!(tools[0].function.name, "test");
-
-    // Other Llama models use JSON
-    let parser = registry.get_parser("llama-2-70b").unwrap();
-    let test_input = r#"{"name": "test", "arguments": {}}"#;
-    let (_normal_text, tools) = parser.parse_complete(test_input).await.unwrap();
-    assert_eq!(tools.len(), 1);
-}
-
-#[tokio::test]
-async fn test_deepseek_models() {
-    let registry = ParserRegistry::new();
-
-    // DeepSeek uses pythonic format (simplified, v3 would need custom parser)
-    let parser = registry.get_parser("deepseek-coder").unwrap();
-    let test_input = r#"[function(arg="value")]"#;
-    let (_normal_text, tools) = parser.parse_complete(test_input).await.unwrap();
-    assert_eq!(tools.len(), 1);
-    assert_eq!(tools[0].function.name, "function");
-}
-
-#[tokio::test]
-async fn test_unknown_model_fallback() {
-    let registry = ParserRegistry::new();
-
-    // Unknown models should fall back to JSON parser
-    let parser = registry.get_parser("unknown-model-xyz").unwrap();
-    let test_input = r#"{"name": "fallback", "arguments": {}}"#;
-    let (_normal_text, tools) = parser.parse_complete(test_input).await.unwrap();
-    assert_eq!(tools.len(), 1);
-    assert_eq!(tools[0].function.name, "fallback");
-}
-
-#[tokio::test]
-async fn test_pattern_specificity() {
-    let registry = ParserRegistry::new();
-
-    // llama-4* should match before llama-*
-    let parser = registry.get_parser("llama-4-70b").unwrap();
-    assert!(parser.detect_format(r#"[test_function(x=1)]"#)); // Pythonic format
-
-    let parser = registry.get_parser("llama-3-70b").unwrap();
-    assert!(parser.detect_format(r#"{"name": "test", "arguments": {}}"#)); // JSON format
-}
-
-#[tokio::test]
-async fn test_real_world_model_outputs() {
-    let registry = ParserRegistry::new();
-
-    let test_cases = vec![
-        (
-            "gpt-4",
-            r#"I'll help you with that.
-
-{"name": "search_web", "arguments": {"query": "latest AI news", "max_results": 5}}
-
-Let me search for that information."#,
-            "search_web",
-        ),
-        (
-            "mistral-large",
-            r#"Let me search for information about Rust.
-
-[TOOL_CALLS] [
-    {"name": "search", "arguments": {"query": "Rust programming"}},
-    {"name": "get_weather", "arguments": {"city": "San Francisco"}}
-]
-
-I've initiated the search."#,
-            "search",
-        ),
-        (
-            "qwen2.5",
-            r#"I'll check the weather for you.
-
-<tool_call>
-{
-    "name": "get_weather",
-    "arguments": {
-        "location": "Tokyo",
-        "units": "celsius"
-    }
-}
-</tool_call>
-
-The weather information has been requested."#,
-            "get_weather",
-        ),
-    ];
-
-    for (model, output, expected_name) in test_cases {
-        let parser = registry.get_parser(model).unwrap();
-        let (_normal_text, tools) = parser.parse_complete(output).await.unwrap();
-        assert!(!tools.is_empty(), "No tools parsed for model {}", model);
-        assert_eq!(
-            tools[0].function.name, expected_name,
-            "Wrong function name for model {}",
-            model
-        );
-    }
-}
--- a/sgl-router/tests/tool_parser_step3.rs
+++ b/sgl-router/tests/tool_parser_step3.rs
@@ -1,6 +1,9 @@
 //! Step3 Parser Integration Tests

-use sglang_router_rs::tool_parser::{ParseState, Step3Parser, StreamResult, ToolParser};
+use sglang_router_rs::tool_parser::{Step3Parser, ToolParser};
+
+mod common;
+use common::create_test_tools;

 #[tokio::test]
 async fn test_step3_complete_parsing() {
@@ -72,8 +75,9 @@ async fn test_step3_type_conversion() {

 #[tokio::test]
 async fn test_step3_streaming() {
-    let parser = Step3Parser::new();
-    let mut state = ParseState::new();
+    let mut parser = Step3Parser::new();
+
+    let tools = create_test_tools();

    // Simulate streaming chunks
    let chunks = vec![
@@ -86,26 +90,20 @@ async fn test_step3_streaming() {
        "\n<｜tool_calls_end｜>",
    ];

-    let mut found_name = false;
    let mut found_complete = false;

    for chunk in chunks {
-        let result = parser.parse_incremental(chunk, &mut state).await.unwrap();
+        let result = parser.parse_incremental(chunk, &tools).await.unwrap();

-        match result {
-            StreamResult::ToolName { name, .. } => {
+        if !result.calls.is_empty() {
+            if let Some(name) = &result.calls[0].name {
                assert_eq!(name, "calc");
-                found_name = true;
-            }
-            StreamResult::ToolComplete(tool) => {
-                assert_eq!(tool.function.name, "calc");
                found_complete = true;
            }
-            _ => {}
        }
    }

-    assert!(found_name || found_complete);
+    assert!(found_complete);
 }

 #[test]
--- a/sgl-router/tests/tool_parser_streaming.rs
+++ b/sgl-router/tests/tool_parser_streaming.rs
@@ -3,36 +3,31 @@
 //! Tests for incremental/streaming parsing capabilities across all parsers

 use sglang_router_rs::tool_parser::{
-    JsonParser, LlamaParser, MistralParser, ParseState, PythonicParser, QwenParser, StreamResult,
-    ToolParser,
+    JsonParser, LlamaParser, MistralParser, PythonicParser, QwenParser, ToolParser,
 };

+mod common;
+use common::create_test_tools;
+
 #[tokio::test]
 async fn test_json_streaming_simple() {
-    let parser = JsonParser::new();
-    let mut state = ParseState::new();
+    let tools = create_test_tools();
+
+    let mut parser = JsonParser::new();

    let full_json = r#"{"name": "get_weather", "arguments": {"location": "San Francisco"}}"#;

-    let result = parser
-        .parse_incremental(full_json, &mut state)
-        .await
-        .unwrap();
+    let result = parser.parse_incremental(full_json, &tools).await.unwrap();

-    match result {
-        StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "get_weather");
-        }
-        _ => {
-            panic!("Expected ToolComplete for complete JSON input");
-        }
-    }
+    assert!(!result.calls.is_empty(), "Should have parsed a tool call");
+    assert_eq!(result.calls[0].name, Some("get_weather".to_string()));
 }

 #[tokio::test]
 async fn test_json_streaming_array() {
-    let parser = JsonParser::new();
-    let mut state = ParseState::new();
+    let tools = create_test_tools();
+
+    let mut parser = JsonParser::new();

    let chunks = vec![
        r#"["#,
@@ -46,9 +41,11 @@ async fn test_json_streaming_array() {
    let mut tool_count = 0;

    for chunk in chunks {
-        let result = parser.parse_incremental(chunk, &mut state).await.unwrap();
-        if let StreamResult::ToolComplete(_) = result {
-            tool_count += 1;
+        let result = parser.parse_incremental(chunk, &tools).await.unwrap();
+        for call in result.calls {
+            if call.name.is_some() {
+                tool_count += 1;
+            }
        }
    }

@@ -58,8 +55,9 @@ async fn test_json_streaming_array() {

 #[tokio::test]
 async fn test_mistral_streaming() {
-    let parser = MistralParser::new();
-    let mut state = ParseState::new();
+    let tools = create_test_tools();
+
+    let mut parser = MistralParser::new();

    let chunks = vec![
        r#"Here is the result: "#,
@@ -72,47 +70,42 @@ async fn test_mistral_streaming() {
        r#"}}]"#,
    ];

-    let mut got_complete = false;
+    let mut got_tool_name = false;

    for chunk in chunks {
-        let result = parser.parse_incremental(chunk, &mut state).await.unwrap();
-        if let StreamResult::ToolComplete(tool) = result {
-            assert_eq!(tool.function.name, "search");
-            got_complete = true;
+        let result = parser.parse_incremental(chunk, &tools).await.unwrap();
+        for call in result.calls {
+            if let Some(name) = call.name {
+                assert_eq!(name, "search");
+                got_tool_name = true;
+            }
        }
    }

-    assert!(got_complete, "Should have completed parsing");
+    assert!(got_tool_name, "Should have found tool name");
 }

 #[tokio::test]
 async fn test_pythonic_streaming() {
-    let parser = PythonicParser::new();
-    let mut state = ParseState::new();
+    let tools = create_test_tools();
+
+    let mut parser = PythonicParser::new();

    let full_input = r#"[get_weather(city="London", units="celsius")]"#;

-    let result = parser
-        .parse_incremental(full_input, &mut state)
-        .await
-        .unwrap();
+    let result = parser.parse_incremental(full_input, &tools).await.unwrap();

-    match result {
-        StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "get_weather");
-            let args: serde_json::Value = serde_json::from_str(&tool.function.arguments).unwrap();
-            assert_eq!(args["city"], "London");
-        }
-        _ => {
-            panic!("Expected ToolComplete for complete pythonic input");
-        }
-    }
+    assert!(!result.calls.is_empty(), "Should have parsed a tool call");
+    assert_eq!(result.calls[0].name, Some("get_weather".to_string()));
+    let args: serde_json::Value = serde_json::from_str(&result.calls[0].parameters).unwrap();
+    assert_eq!(args["city"], "London");
 }

 #[tokio::test]
 async fn test_llama_streaming_with_python_tag() {
-    let parser = LlamaParser::new();
-    let mut state = ParseState::new();
+    let tools = create_test_tools();
+
+    let mut parser = LlamaParser::new();

    let chunks = vec![
        r#"Let me help. "#,
@@ -125,194 +118,197 @@ async fn test_llama_streaming_with_python_tag() {
        r#"}"#,
    ];

-    let mut got_complete = false;
+    let mut got_tool_name = false;

    for chunk in chunks {
-        let result = parser.parse_incremental(chunk, &mut state).await.unwrap();
-        if let StreamResult::ToolComplete(tool) = result {
-            assert_eq!(tool.function.name, "calculate");
-            got_complete = true;
+        let result = parser.parse_incremental(chunk, &tools).await.unwrap();
+        for call in result.calls {
+            if let Some(name) = call.name {
+                assert_eq!(name, "calculate");
+                got_tool_name = true;
+            }
        }
    }

-    assert!(got_complete, "Should have completed parsing");
+    assert!(got_tool_name, "Should have found tool name");
 }

 #[tokio::test]
 async fn test_qwen_streaming() {
-    let parser = QwenParser::new();
-    let mut state = ParseState::new();
+    let tools = create_test_tools();
+
+    let mut parser = QwenParser::new();

    // Note: Parser expects newline after both tags
    let full_input = "<tool_call>\n{\"name\": \"translate\", \"arguments\": {\"text\": \"hello\", \"to\": \"zh\"}}\n</tool_call>";

-    let result = parser
-        .parse_incremental(full_input, &mut state)
-        .await
-        .unwrap();
+    let result = parser.parse_incremental(full_input, &tools).await.unwrap();

-    match result {
-        StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "translate");
-        }
-        other => {
-            panic!(
-                "Expected ToolComplete for complete Qwen input, got: {:?}",
-                other
-            );
-        }
-    }
+    assert!(!result.calls.is_empty(), "Should have parsed a tool call");
+    assert_eq!(result.calls[0].name, Some("translate".to_string()));
 }

 #[tokio::test]
 async fn test_streaming_incomplete_stays_incomplete() {
-    let parser = JsonParser::new();
-    let mut state = ParseState::new();
+    let tools = create_test_tools();
+
+    let mut parser = JsonParser::new();

    let chunks = vec![r#"{"na"#, r#"me": "#];

    for chunk in chunks {
-        let result = parser.parse_incremental(chunk, &mut state).await.unwrap();
+        let result = parser.parse_incremental(chunk, &tools).await.unwrap();
        assert!(
-            matches!(result, StreamResult::Incomplete),
-            "Should return Incomplete for partial JSON, got: {:?}",
+            result.calls.is_empty(),
+            "Should return empty calls for partial JSON, got: {:?}",
            result
        );
    }
-
-    assert!(!state.buffer.is_empty());
-}
-
-#[tokio::test]
-async fn test_streaming_with_text_before_tool() {
-    let parser = JsonParser::new();
-    let mut state = ParseState::new();
-
-    let full_input = r#"{"name": "test", "arguments": {}}"#;
-
-    let result = parser
-        .parse_incremental(full_input, &mut state)
-        .await
-        .unwrap();
-
-    match result {
-        StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "test");
-        }
-        other => {
-            panic!("Expected ToolComplete, got: {:?}", other);
-        }
-    }
 }

 #[tokio::test]
 async fn test_streaming_buffer_accumulation() {
-    let parser = JsonParser::new();
+    let tools = create_test_tools();

-    let mut state = ParseState::new();
+    let mut parser = JsonParser::new();

-    let result1 = parser
-        .parse_incremental(r#"{"na"#, &mut state)
-        .await
-        .unwrap();
+    let result1 = parser.parse_incremental(r#"{"na"#, &tools).await.unwrap();

-    assert!(matches!(result1, StreamResult::Incomplete));
-    assert!(
-        !state.buffer.is_empty(),
-        "Buffer should accumulate incomplete JSON"
-    );
+    assert!(result1.calls.is_empty(), "Should not parse incomplete JSON");

    let result2 = parser
-        .parse_incremental(r#"me": "test", "arguments": {}}"#, &mut state)
+        .parse_incremental(r#"me": "test", "arguments": {}}"#, &tools)
        .await
        .unwrap();

-    match result2 {
-        StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "test");
-            assert!(
-                state.buffer.is_empty(),
-                "Buffer should be cleared after complete parse"
-            );
-        }
-        _ => panic!(
-            "Expected ToolComplete for complete JSON, got: {:?}",
-            result2
-        ),
-    }
+    assert!(
+        !result2.calls.is_empty(),
+        "Should parse complete JSON after buffering"
+    );
+    assert_eq!(result2.calls[0].name, Some("test".to_string()));
 }

 #[tokio::test]
 async fn test_streaming_multiple_tools_sequential() {
-    let parser = QwenParser::new();
-    let mut state = ParseState::new();
+    let tools = create_test_tools();
+
+    let mut parser = QwenParser::new();

    let full_input = r#"<tool_call>
 {"name": "tool1", "arguments": {}}
 </tool_call>"#;

-    let result = parser
-        .parse_incremental(full_input, &mut state)
-        .await
-        .unwrap();
+    let result = parser.parse_incremental(full_input, &tools).await.unwrap();

-    match result {
-        StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "tool1");
-        }
-        _ => {
-            panic!("Expected ToolComplete for first tool");
-        }
-    }
+    assert!(!result.calls.is_empty(), "Should have parsed a tool call");
+    assert_eq!(result.calls[0].name, Some("tool1".to_string()));
 }

 #[tokio::test]
 async fn test_streaming_reset_after_error() {
-    let parser = JsonParser::new();
+    let tools = create_test_tools();

-    let mut state1 = ParseState::new();
-    let _ = parser
-        .parse_incremental(r#"{"name": invalid}"#, &mut state1)
+    let mut parser1 = JsonParser::new();
+
+    let _ = parser1
+        .parse_incremental(r#"{"name": invalid}"#, &tools)
        .await;

-    let mut state2 = ParseState::new();
-    let result = parser
-        .parse_incremental(r#"{"name": "test", "arguments": {}}"#, &mut state2)
+    // Use a new parser instance for clean state
+    let mut parser2 = JsonParser::new();
+    let result = parser2
+        .parse_incremental(r#"{"name": "test", "arguments": {}}"#, &tools)
        .await
        .unwrap();

-    if let StreamResult::ToolComplete(tool) = result {
-        assert_eq!(tool.function.name, "test");
-    }
+    assert!(!result.calls.is_empty(), "Should parse valid JSON");
+    assert_eq!(result.calls[0].name, Some("test".to_string()));
 }

 #[tokio::test]
 async fn test_streaming_with_unicode_chunks() {
-    let parser = JsonParser::new();
-    let mut state = ParseState::new();
+    let tools = create_test_tools();
+
+    let mut parser = JsonParser::new();

    let full_input = r#"{"name": "translate", "arguments": {"text": "Hello 世界 🌍"}}"#;

-    let result = parser
-        .parse_incremental(full_input, &mut state)
+    let result = parser.parse_incremental(full_input, &tools).await.unwrap();
+
+    assert!(!result.calls.is_empty(), "Should have parsed a tool call");
+
+    // Check if we got the tool name
+    if let Some(name) = &result.calls[0].name {
+        assert_eq!(name, "translate");
+    }
+
+    // In streaming mode, need to make another call to get parameters
+    let result2 = parser.parse_incremental("", &tools).await.unwrap();
+
+    // Parameters should be in either result.calls[1] or result2.calls[0]
+    let params = if result.calls.len() > 1 {
+        &result.calls[1].parameters
+    } else if !result2.calls.is_empty() {
+        &result2.calls[0].parameters
+    } else {
+        &result.calls[0].parameters
+    };
+
+    if !params.is_empty() {
+        let args: serde_json::Value = serde_json::from_str(params).unwrap();
+        assert!(args["text"].as_str().unwrap().contains("世界"));
+    }
+}
+
+#[tokio::test]
+async fn test_streaming_with_partial_chunks() {
+    let mut parser = JsonParser::new();
+    let tools = create_test_tools();
+
+    let partial = r#"{"#;
+    let result = parser.parse_incremental(partial, &tools).await.unwrap();
+    assert!(
+        result.calls.is_empty(),
+        "Should return empty calls for just opening brace"
+    );
+
+    let mut parser2 = JsonParser::new();
+    let complete = r#"{"name": "get_weather", "arguments": {"location": "SF"}}"#;
+    let result = parser2.parse_incremental(complete, &tools).await.unwrap();
+
+    assert!(
+        !result.calls.is_empty(),
+        "Expected tool call for complete JSON"
+    );
+    assert_eq!(result.calls[0].name.as_ref().unwrap(), "get_weather");
+
+    // In streaming mode, need to make another call to get parameters
+    let result2 = parser2.parse_incremental("", &tools).await.unwrap();
+
+    // Parameters should be in either result.calls[1] or result2.calls[0]
+    let params = if result.calls.len() > 1 {
+        &result.calls[1].parameters
+    } else if !result2.calls.is_empty() {
+        &result2.calls[0].parameters
+    } else {
+        &result.calls[0].parameters
+    };
+
+    if !params.is_empty() {
+        let args: serde_json::Value = serde_json::from_str(params).unwrap();
+        assert_eq!(args["location"], "SF");
+    }
+
+    // The PartialJson parser can complete partial JSON by filling in missing values
+    let mut parser3 = JsonParser::new();
+    let partial_with_name = r#"{"name": "test", "argum"#;
+    let result = parser3
+        .parse_incremental(partial_with_name, &tools)
        .await
        .unwrap();

-    match result {
-        StreamResult::ToolComplete(tool) => {
-            assert_eq!(tool.function.name, "translate");
-            let args: serde_json::Value = serde_json::from_str(&tool.function.arguments).unwrap();
-            assert!(args["text"].as_str().unwrap().contains("世界"));
-        }
-        StreamResult::ToolName { name, .. } => {
-            assert_eq!(name, "translate");
-        }
-        StreamResult::ToolArguments { arguments, .. } => {
-            let args: serde_json::Value = serde_json::from_str(&arguments).unwrap();
-            assert!(args["text"].as_str().unwrap().contains("世界"));
-        }
-        other => {
-            panic!("Unexpected result: {:?}", other);
-        }
+    // Parser behavior may vary - either complete with partial data or wait for more
+    if !result.calls.is_empty() {
+        assert_eq!(result.calls[0].name.as_ref().unwrap(), "test");
    }
 }