// qwen.rs
use codegraph_core::{CodeGraphError, Result};
use reqwest::{Client, ClientBuilder};
use serde::{Deserialize, Serialize};
use std::time::{Duration, Instant};
use tracing::{debug, info};

/// Configuration for the simple Qwen2.5-Coder client used for MCP integration.
#[derive(Debug, Clone)]
pub struct QwenConfig {
    /// Ollama model tag to request (e.g. a GGUF build of Qwen2.5-Coder).
    pub model_name: String,
    /// Base URL of the Ollama server.
    pub base_url: String,
    /// Context window (num_ctx) to request, in tokens.
    pub context_window: usize,
    /// Maximum tokens to generate (num_predict).
    pub max_tokens: usize,
    /// Sampling temperature; low values favor deterministic output.
    pub temperature: f32,
    /// Overall request timeout; `None` disables the client-side timeout.
    pub request_timeout: Option<Duration>,
    /// Timeout for establishing the TCP connection.
    pub connect_timeout: Duration,
}

impl Default for QwenConfig {
    fn default() -> Self {
        // Optional overall request timeout, in whole seconds; unset or 0 disables it.
        let request_timeout = std::env::var("CODEGRAPH_QWEN_TIMEOUT_SECS")
            .ok()
            .and_then(|raw| raw.parse::<u64>().ok())
            .and_then(|secs| (secs > 0).then(|| Duration::from_secs(secs)));

        // Connect timeout in milliseconds, defaulting to five seconds.
        let connect_timeout = std::env::var("CODEGRAPH_QWEN_CONNECT_TIMEOUT_MS")
            .ok()
            .and_then(|raw| raw.parse::<u64>().ok())
            .map(Duration::from_millis)
            .unwrap_or_else(|| Duration::from_secs(5));

        // Completion budget; non-positive or unparsable values fall back to 1024.
        let max_tokens = std::env::var("CODEGRAPH_QWEN_MAX_TOKENS")
            .ok()
            .and_then(|raw| raw.parse::<usize>().ok())
            .filter(|value| *value > 0)
            .unwrap_or(1024);

        Self {
            model_name: std::env::var("CODEGRAPH_MODEL").unwrap_or_else(|_| {
                "hf.co/unsloth/Qwen2.5-Coder-14B-Instruct-128K-GGUF:Q4_K_M".to_string()
            }),
            base_url: "http://localhost:11434".to_string(),
            context_window: 128000,
            max_tokens,
            temperature: 0.1,
            request_timeout,
            connect_timeout,
        }
    }
}
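
// A minimal sketch of overriding the defaults through the environment before
// constructing the config (the variable names match those read above; the
// values are illustrative):
//
//     std::env::set_var("CODEGRAPH_QWEN_TIMEOUT_SECS", "120");
//     std::env::set_var("CODEGRAPH_QWEN_MAX_TOKENS", "2048");
//     let config = QwenConfig::default();
//     assert_eq!(config.max_tokens, 2048);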

#[derive(Debug, Serialize)]
struct OllamaRequest {
    model: String,
    messages: Vec<Message>,
    stream: bool,
    options: OllamaOptions,
}

#[derive(Debug, Serialize)]
struct Message {
    role: String,
    content: String,
}

#[derive(Debug, Serialize)]
struct OllamaOptions {
    temperature: f32,
    num_predict: usize,
    num_ctx: usize,
}

#[derive(Debug, Deserialize)]
struct OllamaResponse {
    #[serde(default)]
    message: Option<MessageResponse>,
    #[serde(default)]
    eval_count: Option<usize>,
    #[serde(default)]
    prompt_eval_count: Option<usize>,
}

#[derive(Debug, Deserialize)]
struct MessageResponse {
    // Deserialized for completeness; only `content` is read downstream.
    #[allow(dead_code)]
    role: String,
    content: String,
}
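
// For reference, a non-streaming Ollama /api/chat reply looks roughly like the
// JSON below (abridged; the exact field set may vary by Ollama version).
// Unknown fields are ignored by serde; only the three fields above are used:
//
//     {
//       "model": "qwen2.5-coder",
//       "message": { "role": "assistant", "content": "..." },
//       "done": true,
//       "prompt_eval_count": 26,
//       "eval_count": 298
//     }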

/// Result of a single Qwen analysis call, including token-usage metadata.
#[derive(Debug, Clone)]
pub struct QwenResult {
    pub text: String,
    pub model_used: String,
    pub processing_time: Duration,
    pub context_tokens: usize,
    pub completion_tokens: usize,
    pub confidence_score: f32,
}

#[derive(Clone)]
pub struct QwenClient {
    client: Client,
    pub config: QwenConfig,
}

impl QwenClient {
    pub fn new(config: QwenConfig) -> Self {
        let mut builder = ClientBuilder::new()
            .pool_idle_timeout(None)
            .tcp_keepalive(Some(Duration::from_secs(30)))
            .connect_timeout(config.connect_timeout);
        if let Some(timeout) = config.request_timeout {
            builder = builder.timeout(timeout);
        }
        let client = builder.build().expect("Failed to build Qwen HTTP client");
        Self { client, config }
    }
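
    // A minimal construction sketch: default config with an explicit
    // two-minute request timeout (values illustrative):
    //
    //     let client = QwenClient::new(QwenConfig {
    //         request_timeout: Some(Duration::from_secs(120)),
    //         ..QwenConfig::default()
    //     });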

    /// Generate semantic analysis using Qwen2.5-Coder with optimized prompts.
    pub async fn analyze_codebase(&self, query: &str, context: &str) -> Result<QwenResult> {
        let start_time = Instant::now();

        // Use the optimized prompt structure for Qwen2.5-Coder.
        let prompt = crate::prompts::build_semantic_analysis_prompt(query, context);

        // Build the messages array for the chat endpoint.
        let messages = vec![
            Message {
                role: "system".to_string(),
                content: "You are a code analysis expert using Qwen2.5-Coder. Provide detailed, structured analysis of codebases with specific examples and insights.".to_string(),
            },
            Message {
                role: "user".to_string(),
                content: prompt,
            },
        ];

        let request = OllamaRequest {
            model: self.config.model_name.clone(),
            messages,
            stream: false,
            options: OllamaOptions {
                temperature: self.config.temperature,
                num_predict: self.config.max_tokens,
                num_ctx: self.config.context_window,
            },
        };

        debug!(
            "Sending analysis request to Qwen2.5-Coder with a {}-token context window",
            self.config.context_window
        );
        // Log to stderr to avoid polluting the STDIO MCP transport.
        eprintln!(
            "Qwen analysis request started (max_tokens={} timeout={:?})",
            self.config.max_tokens, self.config.request_timeout
        );

        let response = self
            .client
            .post(format!("{}/api/chat", self.config.base_url))
            .json(&request)
            .send()
            .await
            .map_err(|e| CodeGraphError::Network(format!("Qwen request failed: {}", e)))?;

        if !response.status().is_success() {
            let error_text = response
                .text()
                .await
                .unwrap_or_else(|_| "Unknown error".to_string());
            return Err(CodeGraphError::External(format!(
                "Qwen API error: {}",
                error_text
            )));
        }

        let response_data: OllamaResponse = response
            .json()
            .await
            .map_err(|e| CodeGraphError::Parse(format!("Failed to parse Qwen response: {}", e)))?;

        let processing_time = start_time.elapsed();

        // Extract the response text from the assistant message.
        let response_text = response_data
            .message
            .map(|msg| msg.content)
            .unwrap_or_else(|| "No response generated".to_string());
        let confidence_score = self.calculate_confidence(&response_text);

        let result = QwenResult {
            text: response_text,
            model_used: self.config.model_name.clone(),
            processing_time,
            context_tokens: response_data.prompt_eval_count.unwrap_or(0),
            completion_tokens: response_data.eval_count.unwrap_or(0),
            confidence_score,
        };

        // Log to stderr to avoid polluting the STDIO MCP transport.
        eprintln!(
            "Qwen analysis completed: {}ms, context: {} tokens, completion: {} tokens, confidence: {:.2}",
            processing_time.as_millis(),
            result.context_tokens,
            result.completion_tokens,
            result.confidence_score
        );

        Ok(result)
    }
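
    // Usage sketch (inside an async context; error handling elided; the query
    // and context strings are illustrative):
    //
    //     let result = client.analyze_codebase("How is auth handled?", &context).await?;
    //     println!("{} ({} completion tokens)", result.text, result.completion_tokens);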

    /// Check whether a Qwen2.5-Coder model is available on the Ollama server.
    pub async fn check_availability(&self) -> Result<bool> {
        debug!(
            "Checking Qwen2.5-Coder availability at {}",
            self.config.base_url
        );

        let response = self
            .client
            .get(format!("{}/api/tags", self.config.base_url))
            .send()
            .await
            .map_err(|e| {
                CodeGraphError::Network(format!("Qwen availability check failed: {}", e))
            })?;

        if !response.status().is_success() {
            return Ok(false);
        }

        let models: serde_json::Value = response
            .json()
            .await
            .map_err(|_| CodeGraphError::Parse("Failed to parse models response".to_string()))?;
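
        // The tags payload is shaped roughly like this (abridged; an
        // assumption based on the fields accessed below):
        //
        //     { "models": [ { "name": "qwen2.5-coder:latest", ... } ] }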

        // Match either the exact configured model tag or any name containing
        // both "qwen" and "coder", case-insensitively (covers tags such as
        // "qwen2.5-coder" and "Qwen2.5-Coder").
        let has_qwen = models["models"]
            .as_array()
            .map(|models| {
                models.iter().any(|model| {
                    model["name"]
                        .as_str()
                        .map(|name| {
                            let lower = name.to_lowercase();
                            name == self.config.model_name
                                || (lower.contains("qwen") && lower.contains("coder"))
                        })
                        .unwrap_or(false)
                })
            })
            .unwrap_or(false);

        info!("Qwen2.5-Coder availability: {}", has_qwen);
        Ok(has_qwen)
    }
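
    // Gating sketch: check availability before running an analysis (error
    // handling elided; `query` and `context` are illustrative):
    //
    //     if client.check_availability().await? {
    //         let result = client.analyze_codebase(query, &context).await?;
    //     }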

    /// Estimate a confidence score from surface features of the response text.
    fn calculate_confidence(&self, response: &str) -> f32 {
        let mut confidence: f32 = 0.5;

        // A numbered structure suggests the model followed the prompt format.
        if response.contains("1.") && response.contains("2.") {
            confidence += 0.2;
        }
        // Code examples indicate thorough analysis.
        if response.contains("```") {
            confidence += 0.1;
        }
        // Longer responses indicate more comprehensive analysis.
        if response.len() > 1000 {
            confidence += 0.1;
        }
        // Technical terminology indicates code understanding.
        if response.contains("function")
            || response.contains("class")
            || response.contains("module")
        {
            confidence += 0.1;
        }

        confidence.min(0.95) // Cap at 95%.
    }
}
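
// A minimal integration-test sketch (assumes tokio is available as a
// dev-dependency with the rt and macros features, and that a local Ollama
// server is running, hence `#[ignore]`):
#[cfg(test)]
mod tests {
    use super::*;

    #[tokio::test]
    #[ignore = "requires a local Ollama server with a Qwen model pulled"]
    async fn availability_roundtrip() {
        let client = QwenClient::new(QwenConfig::default());
        // check_availability returns Ok(false), not Err, when the server
        // responds but no matching Qwen model is installed.
        let available = client.check_availability().await.expect("server reachable");
        println!("qwen available: {available}");
    }
}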