aws · swapneils · Jun 21, 2025 · dingfeli · Jul 7, 2025 · swapneils
diff --git a/crates/chat-cli/src/api_client/mod.rs b/crates/chat-cli/src/api_client/mod.rs
@@ -31,6 +31,7 @@ pub use endpoints::Endpoint;
 pub use error::ApiClientError;
 use parking_lot::Mutex;
 pub use profile::list_available_profiles;
+
 use serde_json::Map;
 use tracing::{
     debug,
@@ -446,6 +447,7 @@ impl ApiClient {
 
         self.mock_client = Some(Arc::new(Mutex::new(mock.into_iter())));
     }
+
 }
 
 fn timeout_config(database: &Database) -> TimeoutConfig {

diff --git a/crates/chat-cli/src/cli/chat/mod.rs b/crates/chat-cli/src/cli/chat/mod.rs
@@ -284,7 +284,7 @@ impl ChatArgs {
         info!(?conversation_id, "Generated new conversation id");
         let (prompt_request_sender, prompt_request_receiver) = std::sync::mpsc::channel::<Option<String>>();
         let (prompt_response_sender, prompt_response_receiver) = std::sync::mpsc::channel::<Vec<String>>();
-        let mut tool_manager = ToolManagerBuilder::default()
+        let (mut tool_manager, sampling_receiver) = ToolManagerBuilder::default()
             .prompt_list_sender(prompt_response_sender)
             .prompt_list_receiver(prompt_request_receiver)
             .conversation_id(&conversation_id)
@@ -293,6 +293,9 @@ impl ChatArgs {
             .await?;
         let tool_config = tool_manager.load_tools(os, &mut stderr).await?;
 
+        // Hand the ApiClient to the tool manager, which passes it on to each of its MCP clients for sampling
+        tool_manager.set_streaming_client(std::sync::Arc::new(os.client.clone()));
+
         ChatSession::new(
             os,
             stdout,
@@ -307,6 +310,7 @@ impl ChatArgs {
             model_id,
             tool_config,
             !self.no_interactive,
+            sampling_receiver,
         )
         .await?
         .spawn(os)
@@ -480,6 +484,8 @@ pub struct ChatSession {
     conversation: ConversationState,
     tool_uses: Vec<QueuedTool>,
     pending_tool_index: Option<usize>,
+    /// Channel receiver for incoming sampling requests from MCP servers
+    sampling_receiver: tokio::sync::mpsc::UnboundedReceiver<crate::mcp_client::sampling_ipc::PendingSamplingRequest>,
     /// Telemetry events to be sent as part of the conversation.
     tool_use_telemetry_events: HashMap<String, ToolUseEventBuilder>,
     /// State used to keep track of tool use relation
@@ -508,6 +514,7 @@ impl ChatSession {
         model_id: Option<String>,
         tool_config: HashMap<String, ToolSpec>,
         interactive: bool,
+        sampling_receiver: tokio::sync::mpsc::UnboundedReceiver<crate::mcp_client::sampling_ipc::PendingSamplingRequest>,
     ) -> Result<Self> {
         let valid_model_id = match model_id {
             Some(id) => id,
@@ -584,6 +591,7 @@ impl ChatSession {
             conversation,
             tool_uses: vec![],
             pending_tool_index: None,
+            sampling_receiver,
             tool_use_telemetry_events: HashMap::new(),
             tool_use_status: ToolUseStatus::Idle,
             failed_request_ids: Vec::new(),
@@ -1267,6 +1275,17 @@ impl ChatSession {
                 .put_skim_command_selector(os, Arc::new(context_manager.clone()), tool_names);
         }
 
+        // Check for incoming sampling requests and automatically approve them
+        // Since servers now opt-in via configuration, any request that comes through should be approved
+        while let Ok(mut sampling_request) = self.sampling_receiver.try_recv() {
+            tracing::info!(target: "mcp", "Auto-approving sampling request from configured server: {}", sampling_request.server_name);
+
+            // Automatically approve the sampling request
+            sampling_request.send_approval_result(
+                crate::mcp_client::sampling_ipc::SamplingApprovalResult::approved()
+            );
+        }
+
         execute!(
             self.stderr,
             style::SetForegroundColor(Color::Reset),
@@ -2360,6 +2379,12 @@ mod tests {
         agents
     }
 
+    /// Test helper: builds a sampling-request receiver that has no live sender.
+    ///
+    /// The sender half is dropped when this function returns, so the returned
+    /// receiver never yields a request.
+    #[cfg(test)]
+    fn create_dummy_sampling_receiver() -> tokio::sync::mpsc::UnboundedReceiver<crate::mcp_client::sampling_ipc::PendingSamplingRequest> {
+        let (_unused_sender, dummy_receiver) = tokio::sync::mpsc::unbounded_channel();
+        dummy_receiver
+    }
+
     #[tokio::test]
     async fn test_flow() {
         let mut os = Os::new().await.unwrap();
@@ -2403,6 +2428,7 @@ mod tests {
             None,
             tool_config,
             true,
+            create_dummy_sampling_receiver(),
         )
         .await
         .unwrap()
@@ -2544,6 +2570,7 @@ mod tests {
             None,
             tool_config,
             true,
+            create_dummy_sampling_receiver(),
         )
         .await
         .unwrap()
@@ -2640,6 +2667,7 @@ mod tests {
             None,
             tool_config,
             true,
+            create_dummy_sampling_receiver(),
         )
         .await
         .unwrap()
@@ -2714,6 +2742,7 @@ mod tests {
             None,
             tool_config,
             true,
+            create_dummy_sampling_receiver(),
         )
         .await
         .unwrap()
@@ -2764,6 +2793,7 @@ mod tests {
             None,
             tool_config,
             true,
+            create_dummy_sampling_receiver(),
         )
         .await
         .unwrap()

diff --git a/crates/chat-cli/src/cli/chat/tool_manager.rs b/crates/chat-cli/src/cli/chat/tool_manager.rs
@@ -183,7 +183,7 @@ impl ToolManagerBuilder {
         os: &mut Os,
         mut output: Box<dyn Write + Send + Sync + 'static>,
         interactive: bool,
-    ) -> eyre::Result<ToolManager> {
+    ) -> eyre::Result<(ToolManager, tokio::sync::mpsc::UnboundedReceiver<crate::mcp_client::sampling_ipc::PendingSamplingRequest>)> {
         let McpServerConfig { mcp_servers } = self.mcp_server_config.ok_or(eyre::eyre!("Missing mcp server config"))?;
         debug_assert!(self.conversation_id.is_some());
         let conversation_id = self.conversation_id.ok_or(eyre::eyre!("Missing conversation id"))?;
@@ -199,6 +199,9 @@ impl ToolManagerBuilder {
             .map(|(server_name, _)| server_name.clone())
             .collect();
 
+        // Create channel for sampling requests
+        let (sampling_sender, sampling_receiver) = tokio::sync::mpsc::unbounded_channel();
+
         let pre_initialized = enabled_servers
             .into_iter()
             .filter_map(|(server_name, server_config)| {
@@ -211,7 +214,11 @@ impl ToolManagerBuilder {
                     );
                     None
                 } else {
-                    let custom_tool_client = CustomToolClient::from_config(server_name.clone(), server_config);
+                    let custom_tool_client = CustomToolClient::from_config(
+                        server_name.clone(),
+                        server_config,
+                        Some(sampling_sender.clone()),
+                    );
                     Some((server_name, custom_tool_client))
                 }
             })
@@ -687,7 +694,7 @@ impl ToolManagerBuilder {
             });
         }
 
-        Ok(ToolManager {
+        let tool_manager = ToolManager {
             conversation_id,
             clients,
             prompts,
@@ -701,8 +708,11 @@ impl ToolManagerBuilder {
             mcp_load_record: load_record,
             agent,
             disabled_servers: disabled_servers_display,
+            sampling_request_sender: Some(sampling_sender),
             ..Default::default()
-        })
+        };
+
+        Ok((tool_manager, sampling_receiver))
     }
 }
 
@@ -829,6 +839,9 @@ pub struct ToolManager {
     /// The value is the load message (i.e. load time, warnings, and errors)
     pub mcp_load_record: Arc<Mutex<HashMap<String, Vec<LoadingRecord>>>>,
 
+    /// Channel sender for MCP clients to send sampling requests for approval
+    pub sampling_request_sender: Option<tokio::sync::mpsc::UnboundedSender<crate::mcp_client::sampling_ipc::PendingSamplingRequest>>,
+
     /// List of disabled MCP server names for display purposes
     disabled_servers: Vec<String>,
 
@@ -850,12 +863,24 @@ impl Clone for ToolManager {
             is_interactive: self.is_interactive,
             mcp_load_record: self.mcp_load_record.clone(),
             disabled_servers: self.disabled_servers.clone(),
+            sampling_request_sender: self.sampling_request_sender.clone(),
             ..Default::default()
         }
     }
 }
 
 impl ToolManager {
+    /// Hands the given `ApiClient` to every MCP client held in `self.clients`.
+    ///
+    /// Each client receives its own clone of the `Arc` handle. No filtering on
+    /// the per-server sampling setting happens in this method.
+    /// NOTE(review): presumably clients without sampling never use the handle —
+    /// confirm in the MCP client implementation.
+    pub fn set_streaming_client(&self, api_client: std::sync::Arc<crate::api_client::ApiClient>) {
+        tracing::info!(target: "mcp", "Setting ApiClient for MCP clients with sampling enabled");
+
+        for (name, mcp_client) in &self.clients {
+            // Cloning the Arc only bumps the reference count; the ApiClient itself is shared.
+            mcp_client.set_streaming_client(std::sync::Arc::clone(&api_client));
+            tracing::debug!(target: "mcp", "Set ApiClient for server: {}", name);
+        }
+    }
+
     pub async fn load_tools(
         &mut self,
         os: &mut Os,

diff --git a/crates/chat-cli/src/cli/chat/tools/custom_tool.rs b/crates/chat-cli/src/cli/chat/tools/custom_tool.rs
@@ -48,6 +48,8 @@ pub struct CustomToolConfig {
     pub timeout: u64,
     #[serde(default)]
     pub disabled: bool,
+    #[serde(default)]
+    pub sampling: bool,
 }
 
 pub fn default_timeout() -> u64 {
@@ -66,14 +68,32 @@ pub enum CustomToolClient {
 
 impl CustomToolClient {
     // TODO: add support for http transport
-    pub fn from_config(server_name: String, config: CustomToolConfig) -> Result<Self> {
+    /// Forwards the `ApiClient` used for sampling requests to the wrapped MCP client.
+    ///
+    /// `Stdio` is the only variant handled here; the exhaustive `match` means this
+    /// method must be revisited whenever another transport variant is added.
+    pub fn set_streaming_client(&self, api_client: std::sync::Arc<crate::api_client::ApiClient>) {
+        match self {
+            Self::Stdio { client: stdio_client, .. } => {
+                stdio_client.set_streaming_client(api_client);
+            }
+        }
+    }
+
+    pub fn from_config(
+        server_name: String,
+        config: CustomToolConfig,
+        sampling_sender: Option<tokio::sync::mpsc::UnboundedSender<crate::mcp_client::sampling_ipc::PendingSamplingRequest>>,
+    ) -> Result<Self> {
         let CustomToolConfig {
             command,
             args,
             env,
             timeout,
             disabled: _,
+            sampling,
         } = config;
+
+        // Only pass sampling_sender if sampling is enabled for this server
+        let conditional_sampling_sender = if sampling { sampling_sender } else { None };
+
         let mcp_client_config = McpClientConfig {
             server_name: server_name.clone(),
             bin_path: command.clone(),
@@ -84,6 +104,7 @@ impl CustomToolClient {
                "version": "1.0.0"
             }),
             env,
+            sampling_sender: conditional_sampling_sender,
         };
         let client = McpClient::<JsonRpcStdioTransport>::from_config(mcp_client_config)?;
         Ok(CustomToolClient::Stdio {