diff --git a/.github/workflows/pr-test-rust.yml b/.github/workflows/pr-test-rust.yml
index d704488d9..e3ea0305f 100644
--- a/.github/workflows/pr-test-rust.yml
+++ b/.github/workflows/pr-test-rust.yml
@@ -27,6 +27,12 @@ jobs:
         run: |
           bash scripts/ci/ci_install_rust.sh
 
+      - name: Run lint
+        run: |
+          source "$HOME/.cargo/env"
+          cd sgl-router/
+          cargo clippy --all-targets --all-features -- -D warnings
+
       - name: Run fmt
         run: |
           source "$HOME/.cargo/env"
diff --git a/sgl-router/benches/request_processing.rs b/sgl-router/benches/request_processing.rs
index 605bc705b..3b979477c 100644
--- a/sgl-router/benches/request_processing.rs
+++ b/sgl-router/benches/request_processing.rs
@@ -22,7 +22,7 @@ fn create_test_worker() -> BasicWorker {
 fn get_bootstrap_info(worker: &BasicWorker) -> (String, Option<u16>) {
     let hostname = get_hostname(worker.url());
     let bootstrap_port = match worker.worker_type() {
-        WorkerType::Prefill { bootstrap_port } => bootstrap_port.clone(),
+        WorkerType::Prefill { bootstrap_port } => bootstrap_port,
         _ => None,
     };
     (hostname, bootstrap_port)
diff --git a/sgl-router/src/core/error.rs b/sgl-router/src/core/error.rs
index b89ba8032..74e0a0d25 100644
--- a/sgl-router/src/core/error.rs
+++ b/sgl-router/src/core/error.rs
@@ -137,8 +137,7 @@ mod tests {
     fn test_worker_result_type_alias() {
         // Test Ok variant
         let result: WorkerResult<i32> = Ok(42);
-        assert!(result.is_ok());
-        assert_eq!(result.unwrap(), 42);
+        assert!(matches!(result, Ok(42)));
 
         // Test Err variant
         let error = WorkerError::WorkerNotFound {
diff --git a/sgl-router/src/core/worker.rs b/sgl-router/src/core/worker.rs
index e4759ca2b..2466d00b0 100644
--- a/sgl-router/src/core/worker.rs
+++ b/sgl-router/src/core/worker.rs
@@ -311,13 +311,7 @@ impl Worker for BasicWorker {
 
         // Use the shared client with a custom timeout for this request
         let health_result = match WORKER_CLIENT.get(&health_url).timeout(timeout).send().await {
-            Ok(response) => {
-                if response.status().is_success() {
-                    true
-                } else {
-                    false
-                }
-            }
+            Ok(response) => response.status().is_success(),
             Err(_) => false,
         };
 
@@ -571,6 +565,7 @@ impl WorkerFactory {
     }
 
     /// Create workers from URLs with automatic type detection
+    #[allow(clippy::type_complexity)]
     pub fn create_from_urls(
         regular_urls: Vec<String>,
         prefill_urls: Vec<(String, Option<u16>)>,
@@ -1202,12 +1197,6 @@ mod tests {
         for handle in handles {
             handle.await.unwrap();
         }
-
-        // Final state should be deterministic (last write wins)
-        // We can't predict the exact final state due to scheduling,
-        // but we can verify no data corruption occurred
-        let final_health = worker.is_healthy();
-        assert!(final_health == true || final_health == false);
     }
 
     // Test WorkerFactory
diff --git a/sgl-router/src/lib.rs b/sgl-router/src/lib.rs
index 02b626f52..2d8641a9d 100644
--- a/sgl-router/src/lib.rs
+++ b/sgl-router/src/lib.rs
@@ -249,6 +249,7 @@ impl Router {
         health_check_interval_secs = 60,
         health_check_endpoint = String::from("/health"),
     ))]
+    #[allow(clippy::too_many_arguments)]
     fn new(
         worker_urls: Vec<String>,
         policy: PolicyType,
diff --git a/sgl-router/src/metrics.rs b/sgl-router/src/metrics.rs
index 35969f5db..f16bb3235 100644
--- a/sgl-router/src/metrics.rs
+++ b/sgl-router/src/metrics.rs
@@ -510,25 +510,9 @@ mod tests {
 
     // ============= Duration Bucket Tests =============
 
-    #[test]
-    fn test_duration_bucket_values() {
-        let expected_buckets = vec![
-            0.001, 0.005, 0.01, 0.025, 0.05, 0.1, 0.25, 0.5, 1.0, 2.5, 5.0, 10.0, 15.0, 30.0, 45.0,
-            60.0, 90.0, 120.0, 180.0, 240.0,
-        ];
-
-        // The buckets are defined in start_prometheus function
-        assert_eq!(expected_buckets.len(), 20);
-
-        // Verify proper ordering
-        for i in 1..expected_buckets.len() {
-            assert!(expected_buckets[i] > expected_buckets[i - 1]);
-        }
-    }
-
     #[test]
     fn test_duration_bucket_coverage() {
-        let test_cases = vec![
+        let test_cases: [(f64, &str); 7] = [
             (0.0005, "sub-millisecond"),
             (0.005, "5ms"),
             (0.05, "50ms"),
@@ -538,7 +522,7 @@ mod tests {
             (240.0, "4m"),
         ];
 
-        let buckets = vec![
+        let buckets: [f64; 20] = [
             0.001, 0.005, 0.01, 0.025, 0.05, 0.1, 0.25, 0.5, 1.0, 2.5, 5.0, 10.0, 15.0, 30.0, 45.0,
             60.0, 90.0, 120.0, 180.0, 240.0,
         ];
@@ -546,7 +530,7 @@ mod tests {
         for (duration, label) in test_cases {
             let bucket_found = buckets
                 .iter()
-                .any(|&b| ((b - duration) as f64).abs() < 0.0001 || b > duration);
+                .any(|&b| (b - duration).abs() < 0.0001 || b > duration);
             assert!(bucket_found, "No bucket found for {} ({})", duration, label);
         }
     }
@@ -558,14 +542,13 @@ mod tests {
         let matcher = Matcher::Suffix(String::from("duration_seconds"));
 
         // Test matching behavior
-        let _matching_metrics = vec![
+        let _matching_metrics = [
             "request_duration_seconds",
             "response_duration_seconds",
             "sgl_router_request_duration_seconds",
         ];
 
-        let _non_matching_metrics =
-            vec!["duration_total", "duration_seconds_total", "other_metric"];
+        let _non_matching_metrics = ["duration_total", "duration_seconds_total", "other_metric"];
 
         // Note: We can't directly test Matcher matching without the internals,
         // but we can verify the matcher is created correctly
@@ -611,8 +594,8 @@ mod tests {
     #[test]
     fn test_custom_buckets_for_different_metrics() {
         // Test that we can create different bucket configurations
-        let request_buckets = vec![0.001, 0.01, 0.1, 1.0, 10.0];
-        let generate_buckets = vec![0.1, 0.5, 1.0, 5.0, 30.0, 60.0];
+        let request_buckets = [0.001, 0.01, 0.1, 1.0, 10.0];
+        let generate_buckets = [0.1, 0.5, 1.0, 5.0, 30.0, 60.0];
 
         assert_eq!(request_buckets.len(), 5);
         assert_eq!(generate_buckets.len(), 6);
@@ -730,9 +713,6 @@ mod tests {
         for handle in handles {
             handle.join().unwrap();
         }
-
-        // If we get here without panic, concurrent access works
-        assert!(true);
     }
 
     // ============= Edge Cases Tests =============
@@ -743,9 +723,6 @@ mod tests {
         RouterMetrics::record_request("");
         RouterMetrics::set_worker_health("", true);
         RouterMetrics::record_policy_decision("", "");
-
-        // If we get here without panic, empty strings are handled
-        assert!(true);
     }
 
     #[test]
@@ -754,14 +731,11 @@ mod tests {
 
         RouterMetrics::record_request(&long_label);
         RouterMetrics::set_worker_health(&long_label, false);
-
-        // If we get here without panic, long labels are handled
-        assert!(true);
     }
 
     #[test]
     fn test_special_characters_in_labels() {
-        let special_labels = vec![
+        let special_labels = [
             "test/with/slashes",
             "test-with-dashes",
             "test_with_underscores",
@@ -773,9 +747,6 @@ mod tests {
             RouterMetrics::record_request(label);
             RouterMetrics::set_worker_health(label, true);
         }
-
-        // If we get here without panic, special characters are handled
-        assert!(true);
     }
 
     #[test]
@@ -788,9 +759,7 @@ mod tests {
         RouterMetrics::set_worker_load("worker", usize::MAX);
 
         RouterMetrics::record_request_duration("route", Duration::from_nanos(1));
-        RouterMetrics::record_request_duration("route", Duration::from_secs(86400)); // 24 hours
-
-        // If we get here without panic, extreme values are handled
-        assert!(true);
+        // 24 hours
+        RouterMetrics::record_request_duration("route", Duration::from_secs(86400));
     }
 }
diff --git a/sgl-router/src/policies/power_of_two.rs b/sgl-router/src/policies/power_of_two.rs
index 601df6ae5..c10fc2949 100644
--- a/sgl-router/src/policies/power_of_two.rs
+++ b/sgl-router/src/policies/power_of_two.rs
@@ -141,7 +141,7 @@ mod tests {
             vec![Box::new(worker1), Box::new(worker2), Box::new(worker3)];
 
         // Run multiple selections
-        let mut selected_counts = vec![0; 3];
+        let mut selected_counts = [0; 3];
         for _ in 0..100 {
             if let Some(idx) = policy.select_worker(&workers, None) {
                 selected_counts[idx] += 1;
diff --git a/sgl-router/src/routers/header_utils.rs b/sgl-router/src/routers/header_utils.rs
index 92ce5d3b6..0adab5bf0 100644
--- a/sgl-router/src/routers/header_utils.rs
+++ b/sgl-router/src/routers/header_utils.rs
@@ -1,6 +1,6 @@
 use axum::body::Body;
 use axum::extract::Request;
-use axum::http::{HeaderMap, HeaderName, HeaderValue};
+use axum::http::HeaderMap;
 
 /// Copy request headers to a Vec of name-value string pairs
 /// Used for forwarding headers to backend workers
diff --git a/sgl-router/src/routers/pd_router.rs b/sgl-router/src/routers/pd_router.rs
index 79589ef5d..8a1a407a3 100644
--- a/sgl-router/src/routers/pd_router.rs
+++ b/sgl-router/src/routers/pd_router.rs
@@ -363,6 +363,7 @@ impl PDRouter {
         Ok(format!("Successfully removed decode server: {}", url))
     }
 
+    #[allow(clippy::too_many_arguments)]
     pub async fn new(
         prefill_urls: Vec<(String, Option<u16>)>,
         decode_urls: Vec<String>,
@@ -733,6 +734,7 @@ impl PDRouter {
     }
 
     // Internal method that performs the actual dual dispatch (without retry logic)
+    #[allow(clippy::too_many_arguments)]
     async fn execute_dual_dispatch_internal(
         &self,
         headers: Option<&HeaderMap>,
@@ -1145,7 +1147,7 @@ impl PDRouter {
         *response.status_mut() = status;
 
         // Use provided headers or create new ones, then ensure content-type is set for streaming
-        let mut headers = headers.unwrap_or_else(HeaderMap::new);
+        let mut headers = headers.unwrap_or_default();
         headers.insert(CONTENT_TYPE, HeaderValue::from_static("text/event-stream"));
         *response.headers_mut() = headers;
 
@@ -1160,41 +1162,41 @@ impl PDRouter {
         return_logprob: bool,
         prefill_body: Option<bytes::Bytes>,
     ) -> Response {
-        match res.bytes().await {
-            Ok(decode_body) => {
-                if return_logprob && prefill_body.is_some() {
-                    // Merge logprobs from prefill and decode
-                    let prefill_body = prefill_body.as_ref().unwrap();
-                    match (
-                        serde_json::from_slice::<Value>(prefill_body),
-                        serde_json::from_slice::<Value>(&decode_body),
-                    ) {
-                        (Ok(prefill_json), Ok(mut decode_json)) => {
-                            // Use helper to merge logprobs
-                            Self::merge_logprobs_in_json(&prefill_json, &mut decode_json);
-
-                            // Return merged response
-                            match serde_json::to_vec(&decode_json) {
-                                Ok(body) => (status, body).into_response(),
-                                Err(e) => {
-                                    error!("Failed to serialize merged response: {}", e);
-                                    (status, decode_body).into_response()
-                                }
-                            }
-                        }
-                        _ => {
-                            // If parsing fails, just return decode response
-                            warn!("Failed to parse responses for logprob merging");
-                            (status, decode_body).into_response()
-                        }
-                    }
-                } else {
-                    (status, decode_body).into_response()
-                }
-            }
+        let response = res.bytes().await;
+        let decode_body = match response {
+            Ok(decode_body) => decode_body,
             Err(e) => {
                 error!("Failed to read decode response: {}", e);
-                (StatusCode::INTERNAL_SERVER_ERROR, "Failed to read response").into_response()
+                return (StatusCode::INTERNAL_SERVER_ERROR, "Failed to read response")
+                    .into_response();
+            }
+        };
+
+        if !return_logprob {
+            return (status, decode_body).into_response();
+        }
+
+        let Some(prefill_body) = prefill_body else {
+            return (status, decode_body).into_response();
+        };
+
+        // Merge logprobs from prefill and decode
+        let (Ok(prefill_json), Ok(mut decode_json)) = (
+            serde_json::from_slice::<Value>(&prefill_body),
+            serde_json::from_slice::<Value>(&decode_body),
+        ) else {
+            warn!("Failed to parse responses for logprob merging");
+            return (status, decode_body).into_response();
+        };
+
+        Self::merge_logprobs_in_json(&prefill_json, &mut decode_json);
+
+        // Return merged response
+        match serde_json::to_vec(&decode_json) {
+            Ok(body) => (status, body).into_response(),
+            Err(e) => {
+                error!("Failed to serialize merged response: {}", e);
+                (status, decode_body).into_response()
             }
         }
     }
diff --git a/sgl-router/src/routers/router.rs b/sgl-router/src/routers/router.rs
index 36123a37c..87c8b70dd 100644
--- a/sgl-router/src/routers/router.rs
+++ b/sgl-router/src/routers/router.rs
@@ -45,6 +45,7 @@ pub struct Router {
 
 impl Router {
     /// Create a new router with injected policy and client
+    #[allow(clippy::too_many_arguments)]
     pub async fn new(
         worker_urls: Vec<String>,
         policy: Arc<dyn LoadBalancingPolicy>,
diff --git a/sgl-router/src/tree.rs b/sgl-router/src/tree.rs
index 828a6e41d..ea95a6946 100644
--- a/sgl-router/src/tree.rs
+++ b/sgl-router/src/tree.rs
@@ -38,6 +38,7 @@ struct EvictionEntry {
 
 impl Eq for EvictionEntry {}
 
+#[allow(clippy::non_canonical_partial_ord_impl)]
 impl PartialOrd for EvictionEntry {
     fn partial_cmp(&self, other: &Self) -> Option<std::cmp::Ordering> {
         Some(self.timestamp.cmp(&other.timestamp))
@@ -862,8 +863,8 @@ mod tests {
         // spawn 3 threads for insert
         let tree_clone = Arc::clone(&tree);
 
-        let texts = vec!["hello", "apple", "banana"];
-        let tenants = vec!["tenant1", "tenant2", "tenant3"];
+        let texts = ["hello", "apple", "banana"];
+        let tenants = ["tenant1", "tenant2", "tenant3"];
 
         let mut handles = vec![];
 
@@ -916,13 +917,12 @@ mod tests {
         // spawn 3 threads for insert
         let tree_clone = Arc::clone(&tree);
 
-        let texts = vec!["apple", "apabc", "acbdeds"];
+        static TEXTS: [&str; 3] = ["apple", "apabc", "acbdeds"];
 
         let mut handles = vec![];
 
-        for i in 0..3 {
+        for text in TEXTS.iter() {
             let tree_clone = Arc::clone(&tree_clone);
-            let text = texts[i];
             let tenant = "tenant0";
 
             let handle = thread::spawn(move || {
@@ -942,14 +942,13 @@ mod tests {
 
         let tree_clone = Arc::clone(&tree);
 
-        for i in 0..3 {
+        for text in TEXTS.iter() {
             let tree_clone = Arc::clone(&tree_clone);
-            let text = texts[i];
             let tenant = "tenant0";
 
             let handle = thread::spawn(move || {
                 let (matched_text, matched_tenant) = tree_clone.prefix_match(text);
-                assert_eq!(matched_text, text);
+                assert_eq!(matched_text, *text);
                 assert_eq!(matched_tenant, tenant);
             });
 
@@ -964,13 +963,13 @@ mod tests {
 
     #[test]
     fn test_group_prefix_insert_match_concurrent() {
-        let prefix = vec![
+        static PREFIXES: [&str; 4] = [
             "Clock strikes midnight, I'm still wide awake",
             "Got dreams bigger than these city lights",
             "Time waits for no one, gotta make my move",
             "Started from the bottom, that's no metaphor",
         ];
-        let suffix = vec![
+        let suffixes = [
             "Got too much to prove, ain't got time to lose",
             "History in the making, yeah, you can't erase this",
         ];
@@ -978,10 +977,10 @@ mod tests {
 
         let mut handles = vec![];
 
-        for i in 0..prefix.len() {
-            for j in 0..suffix.len() {
+        for (i, prefix) in PREFIXES.iter().enumerate() {
+            for suffix in suffixes.iter() {
                 let tree_clone = Arc::clone(&tree);
-                let text = format!("{} {}", prefix[i], suffix[j]);
+                let text = format!("{} {}", prefix, suffix);
                 let tenant = format!("tenant{}", i);
 
                 let handle = thread::spawn(move || {
@@ -1000,17 +999,15 @@ mod tests {
         tree.pretty_print();
 
         // check matching using multi threads
-
         let mut handles = vec![];
 
-        for i in 0..prefix.len() {
+        for (i, prefix) in PREFIXES.iter().enumerate() {
             let tree_clone = Arc::clone(&tree);
-            let text = prefix[i];
 
             let handle = thread::spawn(move || {
-                let (matched_text, matched_tenant) = tree_clone.prefix_match(text);
+                let (matched_text, matched_tenant) = tree_clone.prefix_match(prefix);
                 let tenant = format!("tenant{}", i);
-                assert_eq!(matched_text, text);
+                assert_eq!(matched_text, *prefix);
                 assert_eq!(matched_tenant, tenant);
             });
 
@@ -1027,13 +1024,13 @@ mod tests {
     fn test_mixed_concurrent_insert_match() {
         // ensure it does not deadlock instead of doing correctness check
 
-        let prefix = vec![
+        static PREFIXES: [&str; 4] = [
             "Clock strikes midnight, I'm still wide awake",
             "Got dreams bigger than these city lights",
             "Time waits for no one, gotta make my move",
             "Started from the bottom, that's no metaphor",
         ];
-        let suffix = vec![
+        let suffixes = [
             "Got too much to prove, ain't got time to lose",
             "History in the making, yeah, you can't erase this",
         ];
@@ -1041,10 +1038,10 @@ mod tests {
 
         let mut handles = vec![];
 
-        for i in 0..prefix.len() {
-            for j in 0..suffix.len() {
+        for (i, prefix) in PREFIXES.iter().enumerate() {
+            for suffix in suffixes.iter() {
                 let tree_clone = Arc::clone(&tree);
-                let text = format!("{} {}", prefix[i], suffix[j]);
+                let text = format!("{} {}", prefix, suffix);
                 let tenant = format!("tenant{}", i);
 
                 let handle = thread::spawn(move || {
@@ -1056,13 +1053,11 @@ mod tests {
         }
 
         // check matching using multi threads
-
-        for i in 0..prefix.len() {
+        for prefix in PREFIXES.iter() {
             let tree_clone = Arc::clone(&tree);
-            let text = prefix[i];
 
             let handle = thread::spawn(move || {
-                let (_matched_text, _matched_tenant) = tree_clone.prefix_match(text);
+                let (_matched_text, _matched_tenant) = tree_clone.prefix_match(prefix);
             });
 
             handles.push(handle);
@@ -1080,16 +1075,14 @@ mod tests {
         // use .chars() to get the iterator of the utf-8 value
         let tree = Arc::new(Tree::new());
 
-        let test_pairs = vec![
+        static TEST_PAIRS: [(&str, &str); 3] = [
             ("你好嗎", "tenant1"),
             ("你好喔", "tenant2"),
             ("你心情好嗎", "tenant3"),
         ];
 
         // Insert sequentially
-        for i in 0..test_pairs.len() {
-            let text = test_pairs[i].0;
-            let tenant = test_pairs[i].1;
+        for (text, tenant) in TEST_PAIRS.iter() {
             tree.insert(text, tenant);
         }
 
@@ -1097,10 +1090,10 @@ mod tests {
 
         // Test sequentially
 
-        for i in 0..test_pairs.len() {
-            let (matched_text, matched_tenant) = tree.prefix_match(test_pairs[i].0);
-            assert_eq!(matched_text, test_pairs[i].0);
-            assert_eq!(matched_tenant, test_pairs[i].1);
+        for (text, tenant) in TEST_PAIRS.iter() {
+            let (matched_text, matched_tenant) = tree.prefix_match(text);
+            assert_eq!(matched_text, *text);
+            assert_eq!(matched_tenant, *tenant);
         }
     }
 
@@ -1108,7 +1101,7 @@ mod tests {
     fn test_utf8_split_concurrent() {
         let tree = Arc::new(Tree::new());
 
-        let test_pairs = vec![
+        static TEST_PAIRS: [(&str, &str); 3] = [
             ("你好嗎", "tenant1"),
             ("你好喔", "tenant2"),
             ("你心情好嗎", "tenant3"),
@@ -1117,13 +1110,11 @@ mod tests {
         // Create multiple threads for insertion
         let mut handles = vec![];
 
-        for i in 0..test_pairs.len() {
+        for (text, tenant) in TEST_PAIRS.iter() {
             let tree_clone = Arc::clone(&tree);
-            let text = test_pairs[i].0.to_string();
-            let tenant = test_pairs[i].1.to_string();
 
             let handle = thread::spawn(move || {
-                tree_clone.insert(&text, &tenant);
+                tree_clone.insert(text, tenant);
             });
 
             handles.push(handle);
@@ -1139,15 +1130,13 @@ mod tests {
         // Create multiple threads for matching
         let mut handles = vec![];
 
-        for i in 0..test_pairs.len() {
+        for (text, tenant) in TEST_PAIRS.iter() {
             let tree_clone = Arc::clone(&tree);
-            let text = test_pairs[i].0.to_string();
-            let tenant = test_pairs[i].1.to_string();
 
             let handle = thread::spawn(move || {
-                let (matched_text, matched_tenant) = tree_clone.prefix_match(&text);
-                assert_eq!(matched_text, text);
-                assert_eq!(matched_tenant, tenant);
+                let (matched_text, matched_tenant) = tree_clone.prefix_match(text);
+                assert_eq!(matched_text, *text);
+                assert_eq!(matched_tenant, *tenant);
             });
 
             handles.push(handle);
@@ -1202,7 +1191,7 @@ mod tests {
         let max_size: usize = 100;
 
         // Define prefixes
-        let prefixes = vec!["aqwefcisdf", "iajsdfkmade", "kjnzxcvewqe", "iejksduqasd"];
+        let prefixes = ["aqwefcisdf", "iajsdfkmade", "kjnzxcvewqe", "iejksduqasd"];
 
         // Insert strings with shared prefixes
         for _i in 0..100 {
diff --git a/sgl-router/tests/api_endpoints_test.rs b/sgl-router/tests/api_endpoints_test.rs
index 284fefb01..c67080d56 100644
--- a/sgl-router/tests/api_endpoints_test.rs
+++ b/sgl-router/tests/api_endpoints_test.rs
@@ -718,7 +718,7 @@ mod worker_management_tests {
         // Add the worker
         let req = Request::builder()
             .method("POST")
-            .uri(&format!("/add_worker?url={}", url))
+            .uri(format!("/add_worker?url={}", url))
             .body(Body::empty())
             .unwrap();
 
@@ -776,7 +776,7 @@ mod worker_management_tests {
         // Remove the worker
         let req = Request::builder()
             .method("POST")
-            .uri(&format!("/remove_worker?url={}", worker_url))
+            .uri(format!("/remove_worker?url={}", worker_url))
             .body(Body::empty())
             .unwrap();
 
@@ -856,7 +856,7 @@ mod worker_management_tests {
         // Add worker first time
         let req = Request::builder()
             .method("POST")
-            .uri(&format!("/add_worker?url={}", url))
+            .uri(format!("/add_worker?url={}", url))
             .body(Body::empty())
             .unwrap();
         let resp = app.clone().oneshot(req).await.unwrap();
@@ -867,7 +867,7 @@ mod worker_management_tests {
         // Try to add same worker again
         let req = Request::builder()
             .method("POST")
-            .uri(&format!("/add_worker?url={}", url))
+            .uri(format!("/add_worker?url={}", url))
             .body(Body::empty())
             .unwrap();
         let resp = app.oneshot(req).await.unwrap();
@@ -896,7 +896,7 @@ mod worker_management_tests {
         // Try to add unhealthy worker
         let req = Request::builder()
             .method("POST")
-            .uri(&format!("/add_worker?url={}", url))
+            .uri(format!("/add_worker?url={}", url))
             .body(Body::empty())
             .unwrap();
         let resp = app.oneshot(req).await.unwrap();
@@ -1412,7 +1412,7 @@ mod pd_mode_tests {
         // Extract port from prefill URL
         let prefill_port = prefill_url
             .split(':')
-            .last()
+            .next_back()
             .and_then(|p| p.trim_end_matches('/').parse::<u16>().ok())
             .unwrap_or(9000);
 
diff --git a/sgl-router/tests/benchmark_integration.rs b/sgl-router/tests/benchmark_integration.rs
index c8c99ea98..16406c461 100644
--- a/sgl-router/tests/benchmark_integration.rs
+++ b/sgl-router/tests/benchmark_integration.rs
@@ -116,6 +116,7 @@ fn default_completion_request() -> CompletionRequest {
     }
 }
 
+#[allow(dead_code)]
 fn create_test_worker() -> BasicWorker {
     BasicWorker::new(
         "http://test-server:8000".to_string(),
diff --git a/sgl-router/tests/common/test_app.rs b/sgl-router/tests/common/test_app.rs
index 7c4cf76eb..d4961f9c3 100644
--- a/sgl-router/tests/common/test_app.rs
+++ b/sgl-router/tests/common/test_app.rs
@@ -8,6 +8,7 @@ use sglang_router_rs::{
 use std::sync::Arc;
 
 /// Create a test Axum application using the actual server's build_app function
+#[allow(dead_code)]
 pub fn create_test_app(
     router: Arc<dyn RouterTrait>,
     client: Client,
diff --git a/sgl-router/tests/request_formats_test.rs b/sgl-router/tests/request_formats_test.rs
index 431e944d3..c0217c590 100644
--- a/sgl-router/tests/request_formats_test.rs
+++ b/sgl-router/tests/request_formats_test.rs
@@ -99,7 +99,7 @@ impl TestContext {
         let worker_url = &worker_urls[0];
 
         let response = client
-            .post(&format!("{}{}", worker_url, endpoint))
+            .post(format!("{}{}", worker_url, endpoint))
             .json(&body)
             .send()
             .await
diff --git a/sgl-router/tests/streaming_tests.rs b/sgl-router/tests/streaming_tests.rs
index 4674593b8..4d1e65cb0 100644
--- a/sgl-router/tests/streaming_tests.rs
+++ b/sgl-router/tests/streaming_tests.rs
@@ -100,7 +100,7 @@ impl TestContext {
         let worker_url = &worker_urls[0];
 
         let response = client
-            .post(&format!("{}{}", worker_url, endpoint))
+            .post(format!("{}{}", worker_url, endpoint))
             .json(&body)
             .send()
             .await
@@ -128,8 +128,8 @@ impl TestContext {
             if let Ok(bytes) = chunk {
                 let text = String::from_utf8_lossy(&bytes);
                 for line in text.lines() {
-                    if line.starts_with("data: ") {
-                        events.push(line[6..].to_string());
+                    if let Some(stripped) = line.strip_prefix("data: ") {
+                        events.push(stripped.to_string());
                     }
                 }
             }
diff --git a/sgl-router/tests/test_pd_routing.rs b/sgl-router/tests/test_pd_routing.rs
index 6035da0a8..2bf47b187 100644
--- a/sgl-router/tests/test_pd_routing.rs
+++ b/sgl-router/tests/test_pd_routing.rs
@@ -1,6 +1,5 @@
 #[cfg(test)]
 mod test_pd_routing {
-    use rand::Rng;
     use serde_json::json;
     use sglang_router_rs::config::{
         CircuitBreakerConfig, PolicyConfig, RetryConfig, RouterConfig, RoutingMode,
@@ -421,41 +420,6 @@ mod test_pd_routing {
         assert_eq!(received_loads.get("http://decode2:8080"), Some(&15));
     }
 
-    #[test]
-    fn test_power_of_two_load_selection() {
-        // Test the power-of-two selection logic with different load scenarios
-
-        // Scenario 1: Clear winner for both prefill and decode
-        let _loads = vec![
-            ("prefill1", 100),
-            ("prefill2", 10), // Should be selected
-            ("decode1", 50),
-            ("decode2", 5), // Should be selected
-        ];
-
-        // In actual implementation, the lower load should be selected
-        assert!(10 < 100);
-        assert!(5 < 50);
-
-        // Scenario 2: Equal loads (should select first)
-        let _equal_loads = vec![
-            ("prefill1", 20),
-            ("prefill2", 20), // Either could be selected
-            ("decode1", 30),
-            ("decode2", 30), // Either could be selected
-        ];
-
-        // When loads are equal, <= comparison means first is selected
-        assert!(20 <= 20);
-        assert!(30 <= 30);
-
-        // Scenario 3: Missing load data (should default to usize::MAX)
-        // This tests the unwrap_or(usize::MAX) behavior
-        let missing_load = usize::MAX;
-        assert!(10 < missing_load);
-        assert!(missing_load > 0);
-    }
-
     #[test]
     fn test_load_monitoring_configuration() {
         // Test that load monitoring is only enabled for PowerOfTwo policy
@@ -605,12 +569,10 @@ mod test_pd_routing {
     #[test]
     fn test_streaming_response_parsing() {
         // Test SSE format parsing from streaming responses
-        let sse_chunks = vec![
-            "data: {\"text\":\"Hello\",\"meta_info\":{\"completion_tokens\":1,\"finish_reason\":null}}",
+        let sse_chunks = ["data: {\"text\":\"Hello\",\"meta_info\":{\"completion_tokens\":1,\"finish_reason\":null}}",
             "data: {\"text\":\" world\",\"meta_info\":{\"completion_tokens\":2,\"finish_reason\":null}}",
             "data: {\"text\":\"!\",\"meta_info\":{\"completion_tokens\":3,\"finish_reason\":{\"type\":\"length\"}}}",
-            "data: [DONE]",
-        ];
+            "data: [DONE]"];
 
         for chunk in &sse_chunks[..3] {
             assert!(chunk.starts_with("data: "));
@@ -848,7 +810,7 @@ mod test_pd_routing {
             large_batch_request["bootstrap_host"] = json!(vec![hostname; batch_size]);
             large_batch_request["bootstrap_port"] = json!(vec![bootstrap_port; batch_size]);
             large_batch_request["bootstrap_room"] = json!((0..batch_size)
-                .map(|_| rand::thread_rng().gen::<u64>())
+                .map(|_| rand::random::<u64>())
                 .collect::<Vec<_>>());
 
             let elapsed = start.elapsed();