llm_client/src/clients/openai.rs (15 changes: 13 additions & 2 deletions)
@@ -243,8 +243,19 @@ impl LLMClient for OpenAIClient {
             request_builder = request_builder.temperature(request.temperature());
         }
 
-        // if its o1 or o3-mini we should set reasoning_effort to high
-        if llm_model == &LLMType::O1 || llm_model == &LLMType::O3MiniHigh {
+        if let Some(reasoning_effort) = request.reasoning_effort() {
+            match reasoning_effort {
+                crate::clients::types::ReasoningEffort::Low => {
+                    request_builder = request_builder.reasoning_effort(ReasoningEffort::Low);
+                }
+                crate::clients::types::ReasoningEffort::Medium => {
+                    request_builder = request_builder.reasoning_effort(ReasoningEffort::Medium);
+                }
+                crate::clients::types::ReasoningEffort::High => {
+                    request_builder = request_builder.reasoning_effort(ReasoningEffort::High);
+                }
+            }
+        } else if llm_model == &LLMType::O1 || llm_model == &LLMType::O3MiniHigh {
             request_builder = request_builder.reasoning_effort(ReasoningEffort::High);
         }

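The net behavior in openai.rs: a per-request effort, when present, takes precedence, and the old always-High default for O1/O3MiniHigh survives as the fallback. A self-contained sketch of that precedence rule, using hypothetical stand-in enums rather than the crate's real types:

```rust
// Standalone illustration of the precedence rule above; `Effort` and `Model`
// are hypothetical stand-ins, not the crate's actual types.
#[derive(Debug, Clone, Copy, PartialEq)]
enum Effort {
    Low,
    Medium,
    High,
}

#[derive(PartialEq)]
enum Model {
    O1,
    O3MiniHigh,
    Other,
}

// An explicit per-request effort wins; otherwise reasoning models default to High.
fn effective_effort(requested: Option<Effort>, model: &Model) -> Option<Effort> {
    match requested {
        Some(effort) => Some(effort),
        None if *model == Model::O1 || *model == Model::O3MiniHigh => Some(Effort::High),
        None => None,
    }
}

fn main() {
    // An explicit Low now overrides the old always-High default for O1.
    assert_eq!(effective_effort(Some(Effort::Low), &Model::O1), Some(Effort::Low));
    // With nothing requested, the previous behavior is preserved.
    assert_eq!(effective_effort(None, &Model::O1), Some(Effort::High));
    assert_eq!(effective_effort(None, &Model::Other), None);
}
```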
llm_client/src/clients/openai_compatible.rs (14 changes: 14 additions & 0 deletions)
@@ -167,6 +167,20 @@ impl LLMClient for OpenAICompatibleClient {
             .messages(messages)
             .temperature(request.temperature())
             .stream(true);
+
+        if let Some(reasoning_effort) = request.reasoning_effort() {
+            match reasoning_effort {
+                crate::clients::types::ReasoningEffort::Low => {
+                    request_builder = request_builder.reasoning_effort(async_openai::types::ReasoningEffort::Low);
+                }
+                crate::clients::types::ReasoningEffort::Medium => {
+                    request_builder = request_builder.reasoning_effort(async_openai::types::ReasoningEffort::Medium);
+                }
+                crate::clients::types::ReasoningEffort::High => {
+                    request_builder = request_builder.reasoning_effort(async_openai::types::ReasoningEffort::High);
+                }
+            }
+        }
         if let Some(frequency_penalty) = request.frequency_penalty() {
             request_builder = request_builder.frequency_penalty(frequency_penalty);
         }
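The same three-arm match now appears in both clients. If the duplication becomes a nuisance, one option would be a `From` conversion on the crate-local enum so each call site shrinks to `.reasoning_effort(effort.into())`. A minimal sketch with hypothetical local stand-ins for the two enums (the real ones live in `crate::clients::types` and `async_openai::types`):

```rust
// Hypothetical refactor sketch: local stand-ins keep the conversion pattern
// self-contained; `ApiReasoningEffort` plays the role of the async_openai enum.
#[derive(Clone, Debug, PartialEq, Eq)]
pub enum ReasoningEffort {
    Low,
    Medium,
    High,
}

#[derive(Debug, PartialEq)]
pub enum ApiReasoningEffort {
    Low,
    Medium,
    High,
}

// Converting from a reference matches the accessor, which hands out
// Option<&ReasoningEffort> rather than an owned value.
impl From<&ReasoningEffort> for ApiReasoningEffort {
    fn from(effort: &ReasoningEffort) -> Self {
        match effort {
            ReasoningEffort::Low => ApiReasoningEffort::Low,
            ReasoningEffort::Medium => ApiReasoningEffort::Medium,
            ReasoningEffort::High => ApiReasoningEffort::High,
        }
    }
}

fn main() {
    // Each client's if-let body could then become a single line, e.g.:
    // request_builder = request_builder.reasoning_effort(effort.into());
    let effort = ReasoningEffort::Medium;
    assert_eq!(ApiReasoningEffort::from(&effort), ApiReasoningEffort::Medium);
}
```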
llm_client/src/clients/types.rs (18 changes: 18 additions & 0 deletions)
@@ -685,6 +685,13 @@ impl LLMClientMessage {
     }
 }
 
+#[derive(Clone, Debug, PartialEq, Eq)]
+pub enum ReasoningEffort {
+    Low,
+    Medium,
+    High,
+}
+
 #[derive(Clone, Debug)]
 pub struct LLMClientCompletionRequest {
     model: LLMType,
@@ -693,6 +700,7 @@ pub struct LLMClientCompletionRequest {
     frequency_penalty: Option<f32>,
     stop_words: Option<Vec<String>>,
     max_tokens: Option<usize>,
+    reasoning_effort: Option<ReasoningEffort>,
 }
 
 #[derive(Clone)]
@@ -771,6 +779,7 @@ impl LLMClientCompletionRequest {
             frequency_penalty,
             stop_words: None,
             max_tokens: None,
+            reasoning_effort: None,
         }
     }
 
@@ -859,6 +868,15 @@ impl LLMClientCompletionRequest {
     pub fn get_max_tokens(&self) -> Option<usize> {
         self.max_tokens
     }
+
+    pub fn set_reasoning_effort(mut self, reasoning_effort: ReasoningEffort) -> Self {
+        self.reasoning_effort = Some(reasoning_effort);
+        self
+    }
+
+    pub fn reasoning_effort(&self) -> Option<&ReasoningEffort> {
+        self.reasoning_effort.as_ref()
+    }
 }
 
 #[derive(Debug, Clone, Default, serde::Serialize, serde::Deserialize)]
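For callers, the new field is opt-in through the consuming setter added in types.rs. A minimal sketch of the intended round trip on a stripped-down stand-in struct, since the full `LLMClientCompletionRequest` constructor is not shown in this diff:

```rust
// Stand-in for the real request type: only the new field is modeled here.
#[derive(Clone, Debug, PartialEq, Eq)]
pub enum ReasoningEffort {
    Low,
    Medium,
    High,
}

#[derive(Default)]
struct Request {
    reasoning_effort: Option<ReasoningEffort>,
}

impl Request {
    // Same consuming builder style as set_reasoning_effort in the diff.
    fn set_reasoning_effort(mut self, reasoning_effort: ReasoningEffort) -> Self {
        self.reasoning_effort = Some(reasoning_effort);
        self
    }

    // Borrowing accessor, as in the diff: clients read it without taking ownership.
    fn reasoning_effort(&self) -> Option<&ReasoningEffort> {
        self.reasoning_effort.as_ref()
    }
}

fn main() {
    // Effort is opt-in: leaving it unset preserves the model-based default
    // in the OpenAI client, while setting it overrides that default.
    let request = Request::default().set_reasoning_effort(ReasoningEffort::Medium);
    assert_eq!(request.reasoning_effort(), Some(&ReasoningEffort::Medium));
}
```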