make client immutable (#94)

kerthcet · web-flow · commit b3e3bf66767f · 2026-01-04T03:38:47.000Z
Signed-off-by: kerthcet <kerthcet@gmail.com>
diff --git a/README.md b/README.md
@@ -67,7 +67,7 @@ fn main() {
         .build()
         .unwrap();
 
-    let mut client = client::Client::new(config);
+    let client = client::Client::new(config);
     let request = chat::CreateChatCompletionRequestArgs::default()
         .messages([
             chat::ChatCompletionRequestSystemMessage::from("You are a helpful assistant.").into(),
diff --git a/examples/wrr.rs b/examples/wrr.rs
@@ -23,7 +23,7 @@ fn main() {
         .build()
         .unwrap();
 
-    let mut client = client::Client::new(config);
+    let client = client::Client::new(config);
     let request = chat::CreateChatCompletionRequestArgs::default()
         .messages([
             chat::ChatCompletionRequestSystemMessage::from("You are a helpful assistant.").into(),
diff --git a/src/client/client.rs b/src/client/client.rs
@@ -29,7 +29,7 @@ impl Client {
     }
 
     pub async fn create_response(
-        &mut self,
+        &self,
         request: responses::CreateResponse,
     ) -> Result<responses::Response, OpenAIError> {
         let candidate = self.router.sample();
@@ -39,7 +39,7 @@ impl Client {
 
     // This is chat completion endpoint.
     pub async fn create_completion(
-        &mut self,
+        &self,
         request: chat::CreateChatCompletionRequest,
     ) -> Result<chat::CreateChatCompletionResponse, OpenAIError> {
         let candidate = self.router.sample();
diff --git a/src/router/random.rs b/src/router/random.rs
@@ -18,7 +18,7 @@ impl Router for RandomRouter {
         "RandomRouter"
     }
 
-    fn sample(&mut self) -> ModelName {
+    fn sample(&self) -> ModelName {
         let mut rng = rand::rng();
         let idx = rng.random_range(0..self.model_infos.len());
         self.model_infos[idx].name.clone()
diff --git a/src/router/router.rs b/src/router/router.rs
@@ -24,7 +24,7 @@ pub fn construct_router(mode: RouterMode, models: Vec<ModelConfig>) -> Box<dyn R
 
 pub trait Router {
     fn name(&self) -> &'static str;
-    fn sample(&mut self) -> ModelName;
+    fn sample(&self) -> ModelName;
 }
 
 #[cfg(test)]
diff --git a/src/router/wrr.rs b/src/router/wrr.rs
@@ -1,11 +1,13 @@
+use std::sync::atomic::AtomicI32;
+
 use crate::client::config::ModelName;
 use crate::router::router::{ModelInfo, Router};
 
 pub struct WeightedRoundRobinRouter {
     total_weight: i32,
     model_infos: Vec<ModelInfo>,
     // current_weight is ordered by model_infos index.
-    current_weights: Vec<i32>,
+    current_weights: Vec<AtomicI32>,
 }
 
 impl WeightedRoundRobinRouter {
@@ -16,7 +18,7 @@ impl WeightedRoundRobinRouter {
         Self {
             model_infos: model_infos,
             total_weight: total_weight,
-            current_weights: vec![0; length],
+            current_weights: (0..length).map(|_| AtomicI32::new(0)).collect(),
         }
     }
 }
@@ -27,27 +29,28 @@ impl Router for WeightedRoundRobinRouter {
     }
 
     // Use Smooth Weighted Round Robin Algorithm.
-    fn sample(&mut self) -> ModelName {
+    fn sample(&self) -> ModelName {
         // return early if only one model.
         if self.model_infos.len() == 1 {
             return self.model_infos[0].name.clone();
         }
 
-        self.current_weights
-            .iter_mut()
-            .enumerate()
-            .for_each(|(i, weight)| {
-                *weight += self.model_infos[i].weight;
-            });
+        // 1. add weight to current weight.
+        self.model_infos.iter().enumerate().for_each(|(i, weight)| {
+            self.current_weights[i].fetch_add(weight.weight, std::sync::atomic::Ordering::Relaxed);
+        });
 
         let mut max_index = 0;
         for i in 1..self.current_weights.len() {
-            if self.current_weights[i] > self.current_weights[max_index] {
+            if self.current_weights[i].load(std::sync::atomic::Ordering::Relaxed)
+                > self.current_weights[max_index].load(std::sync::atomic::Ordering::Relaxed)
+            {
                 max_index = i;
             }
         }
 
-        self.current_weights[max_index] -= self.total_weight;
+        self.current_weights[max_index]
+            .fetch_sub(self.total_weight, std::sync::atomic::Ordering::Relaxed);
         self.model_infos[max_index].name.clone()
     }
 }
diff --git a/tests/client.rs b/tests/client.rs
@@ -8,6 +8,31 @@ use arms::types::responses;
 mod tests {
     use super::*;
 
+    #[tokio::test]
+    async fn test_completion() {
+        from_filename(".env.integration-test").ok();
+
+        let config = client::Config::builder()
+            .provider("faker")
+            .model(
+                client::ModelConfig::builder()
+                    .name("fake-completion-model")
+                    .build()
+                    .unwrap(),
+            )
+            .build()
+            .unwrap();
+
+        let client = client::Client::new(config);
+        let request = chat::CreateChatCompletionRequestArgs::default()
+            .build()
+            .unwrap();
+
+        let response = client.create_completion(request).await.unwrap();
+        assert!(response.id.starts_with("fake-completion-id"));
+        assert!(response.model == "fake-completion-model");
+    }
+
     #[tokio::test]
     async fn test_response() {
         from_filename(".env.integration-test").ok();
@@ -24,7 +49,7 @@ mod tests {
             .build()
             .unwrap();
 
-        let mut client = client::Client::new(config);
+        let client = client::Client::new(config);
         let request = responses::CreateResponseArgs::default()
             .input("tell me the weather today")
             .build()
@@ -45,7 +70,7 @@ mod tests {
             )
             .build()
             .unwrap();
-        let mut client = client::Client::new(config);
+        let client = client::Client::new(config);
         let request = responses::CreateResponseArgs::default()
             .model("gpt-3.5-turbo")
             .input("tell me a joke")
@@ -74,36 +99,11 @@ mod tests {
             )
             .build()
             .unwrap();
-        let mut client = client::Client::new(config);
+        let client = client::Client::new(config);
         let request = responses::CreateResponseArgs::default()
             .input("give me a poem about nature")
             .build()
             .unwrap();
         let _ = client.create_response(request).await.unwrap();
     }
-
-    #[tokio::test]
-    async fn test_completion() {
-        from_filename(".env.integration-test").ok();
-
-        let config = client::Config::builder()
-            .provider("faker")
-            .model(
-                client::ModelConfig::builder()
-                    .name("fake-completion-model")
-                    .build()
-                    .unwrap(),
-            )
-            .build()
-            .unwrap();
-
-        let mut client = client::Client::new(config);
-        let request = chat::CreateChatCompletionRequestArgs::default()
-            .build()
-            .unwrap();
-
-        let response = client.create_completion(request).await.unwrap();
-        assert!(response.id.starts_with("fake-completion-id"));
-        assert!(response.model == "fake-completion-model");
-    }
 }

Original file line number	Diff line number	Diff line change
`@@ -18,7 +18,7 @@ impl Router for RandomRouter {`
`18`	`18`	`"RandomRouter"`
`19`	`19`	`}`
`20`	`20`
`21`		`- fn sample(&mut self) -> ModelName {`
	`21`	`+ fn sample(&self) -> ModelName {`
`22`	`22`	`let mut rng = rand::rng();`
`23`	`23`	`let idx = rng.random_range(0..self.model_infos.len());`
`24`	`24`	`self.model_infos[idx].name.clone()`
Original file line number	Diff line number	Diff line change
`@@ -24,7 +24,7 @@ pub fn construct_router(mode: RouterMode, models: Vec<ModelConfig>) -> Box<dyn R`
`24`	`24`
`25`	`25`	`pub trait Router {`
`26`	`26`	`fn name(&self) -> &'static str;`
`27`		`- fn sample(&mut self) -> ModelName;`
	`27`	`+ fn sample(&self) -> ModelName;`
`28`	`28`	`}`
`29`	`29`
`30`	`30`	`#[cfg(test)]`
Original file line number	Diff line number	Diff line change
`@@ -1,11 +1,13 @@`
	`1`	`+use std::sync::atomic::AtomicI32;`
	`2`	`+`
`1`	`3`	`use crate::client::config::ModelName;`
`2`	`4`	`use crate::router::router::{ModelInfo, Router};`
`3`	`5`
`4`	`6`	`pub struct WeightedRoundRobinRouter {`
`5`	`7`	`total_weight: i32,`
`6`	`8`	`model_infos: Vec<ModelInfo>,`
`7`	`9`	`// current_weight is ordered by model_infos index.`
`8`		`- current_weights: Vec<i32>,`
	`10`	`+ current_weights: Vec<AtomicI32>,`
`9`	`11`	`}`
`10`	`12`
`11`	`13`	`impl WeightedRoundRobinRouter {`
`@@ -16,7 +18,7 @@ impl WeightedRoundRobinRouter {`
`16`	`18`	`Self {`
`17`	`19`	`model_infos: model_infos,`
`18`	`20`	`total_weight: total_weight,`
`19`		`- current_weights: vec![0; length],`
	`21`	`+ current_weights: (0..length).map(\|_\| AtomicI32::new(0)).collect(),`
`20`	`22`	`}`
`21`	`23`	`}`
`22`	`24`	`}`
`@@ -27,27 +29,28 @@ impl Router for WeightedRoundRobinRouter {`
`27`	`29`	`}`
`28`	`30`
`29`	`31`	`// Use Smooth Weighted Round Robin Algorithm.`
`30`		`- fn sample(&mut self) -> ModelName {`
	`32`	`+ fn sample(&self) -> ModelName {`
`31`	`33`	`// return early if only one model.`
`32`	`34`	`if self.model_infos.len() == 1 {`
`33`	`35`	`return self.model_infos[0].name.clone();`
`34`	`36`	`}`
`35`	`37`
`36`		`- self.current_weights`
`37`		`- .iter_mut()`
`38`		`- .enumerate()`
`39`		`- .for_each(\|(i, weight)\| {`
`40`		`- *weight += self.model_infos[i].weight;`
`41`		`- });`
	`38`	`+ // 1. add weight to current weight.`
	`39`	`+ self.model_infos.iter().enumerate().for_each(\|(i, weight)\| {`
	`40`	`+ self.current_weights[i].fetch_add(weight.weight, std::sync::atomic::Ordering::Relaxed);`
	`41`	`+ });`
`42`	`42`
`43`	`43`	`let mut max_index = 0;`
`44`	`44`	`for i in 1..self.current_weights.len() {`
`45`		`- if self.current_weights[i] > self.current_weights[max_index] {`
	`45`	`+ if self.current_weights[i].load(std::sync::atomic::Ordering::Relaxed)`
	`46`	`+ > self.current_weights[max_index].load(std::sync::atomic::Ordering::Relaxed)`
	`47`	`+ {`
`46`	`48`	`max_index = i;`
`47`	`49`	`}`
`48`	`50`	`}`
`49`	`51`
`50`		`- self.current_weights[max_index] -= self.total_weight;`
	`52`	`+ self.current_weights[max_index]`
	`53`	`+ .fetch_sub(self.total_weight, std::sync::atomic::Ordering::Relaxed);`
`51`	`54`	`self.model_infos[max_index].name.clone()`
`52`	`55`	`}`
`53`	`56`	`}`