"""
纯 DoWhy 敏感性分析工具 - 100% 使用 DoWhy 原生方法,不重复造轮子
"""
import logging
from typing import Any, Dict, List, Optional
import pandas as pd
import numpy as np
import dowhy
from mcp.server.fastmcp import FastMCP
from ..utils.data_processor import load_and_validate_data, serialize_response
logger = logging.getLogger("dowhy-mcp-server.sensitivity")
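# Minimal usage sketch (the server name is illustrative): create a FastMCP instance
# and pass it to the registration function, e.g.
#     server = FastMCP("dowhy-mcp-server")
#     register_sensitivity_tools(server)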
def register_sensitivity_tools(server: FastMCP) -> None:
"""注册所有纯 DoWhy 敏感性分析工具"""
@server.tool()
def e_value_analyzer(
observed_effect: float,
confidence_interval: Optional[Dict[str, float]] = None
) -> Dict[str, Any]:
"""
使用DoWhy进行E-value敏感性分析
注意:E-value是统计学概念,DoWhy没有直接实现,但我们使用DoWhy的敏感性分析框架
"""
try:
# DoWhy has no direct E-value implementation; the E-value is a general statistical concept.
# Return an explanation and point the caller to DoWhy's other sensitivity-analysis methods.
return {
"success": False,
"error": "E-value计算不是DoWhy的原生功能。请使用DoWhy的refutation方法进行敏感性分析。",
"method": "E-value Analysis",
"recommendation": "使用refutation_test_suite工具进行DoWhy原生敏感性分析",
"alternative_tools": [
"refutation_test_suite",
"unobserved_confounder_analyzer",
"stability_analyzer"
]
}
except Exception as e:
return {
"success": False,
"error": str(e),
"method": "E-value Analysis"
}
@server.tool()
def rosenbaum_bounds_analyzer(
data_path: str,
treatment: str,
outcome: str,
confounders: List[str],
gamma_values: Optional[List[float]] = None
) -> Dict[str, Any]:
"""
使用 DoWhy 进行 Rosenbaum 界限敏感性分析
"""
try:
all_vars = [treatment, outcome] + confounders
data = load_and_validate_data(data_path, all_vars)
# Estimate the baseline effect with DoWhy
model = dowhy.CausalModel(
data=data,
treatment=treatment,
outcome=outcome,
common_causes=confounders
)
identified_estimand = model.identify_effect(proceed_when_unidentifiable=True)
base_estimate = model.estimate_effect(
identified_estimand,
method_name="backdoor.propensity_score_matching"
)
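# Note: backdoor.propensity_score_matching assumes a binary (0/1) treatment; for
# continuous treatments a regression-based estimator would be more appropriate.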
# Sensitivity analysis via DoWhy's native refutation methods
refutation_results = []
# 1. Refutation that adds an unobserved common cause (confounder)
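# add_unobserved_common_cause simulates a confounder acting on both treatment and
# outcome with the given effect strengths and re-estimates the effect; the small
# strengths below (0.01 / 0.02) are illustrative defaults, not calibrated values.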
try:
unobserved_refutation = model.refute_estimate(
identified_estimand,
base_estimate,
method_name="add_unobserved_common_cause",
confounders_effect_on_treatment="binary_flip",
confounders_effect_on_outcome="linear",
effect_strength_on_treatment=0.01,
effect_strength_on_outcome=0.02
)
refutation_results.append({
"method": "add_unobserved_common_cause",
"original_effect": float(base_estimate.value),
"new_effect": float(unobserved_refutation.new_effect),
"p_value": float(unobserved_refutation.refutation_result.get('p_value', 0))
})
except Exception as e:
logger.warning(f"Unobserved confounder refutation failed: {e}")
# 2. Random common cause refutation
try:
random_refutation = model.refute_estimate(
identified_estimand,
base_estimate,
method_name="random_common_cause"
)
refutation_results.append({
"method": "random_common_cause",
"original_effect": float(base_estimate.value),
"new_effect": float(random_refutation.new_effect),
"p_value": float(random_refutation.refutation_result.get('p_value', 0))
})
except Exception as e:
logger.warning(f"Random common cause refutation failed: {e}")
return serialize_response({
"success": True,
"method": "DoWhy Sensitivity Analysis (Refutation-based)",
"treatment": treatment,
"outcome": outcome,
"confounders": confounders,
"original_estimate": float(base_estimate.value),
"refutation_results": refutation_results,
"sample_size": len(data),
"note": "使用DoWhy原生refutation方法替代自定义Rosenbaum bounds计算"
})
except Exception as e:
return {
"success": False,
"error": str(e),
"method": "DoWhy Rosenbaum Bounds Analysis"
}
@server.tool()
def refutation_test_suite(
data_path: str,
treatment: str,
outcome: str,
confounders: List[str],
causal_estimate: float
) -> Dict[str, Any]:
"""
使用 DoWhy 运行全面的反驳测试套件
"""
try:
all_vars = [treatment, outcome] + confounders
data = load_and_validate_data(data_path, all_vars)
# Build the DoWhy causal model
model = dowhy.CausalModel(
data=data,
treatment=treatment,
outcome=outcome,
common_causes=confounders
)
identified_estimand = model.identify_effect(proceed_when_unidentifiable=True)
estimate = model.estimate_effect(
identified_estimand,
method_name="backdoor.linear_regression"
)
refutation_results = {}
# 1. Random common cause refutation
try:
refute_random = model.refute_estimate(
identified_estimand,
estimate,
method_name="random_common_cause"
)
refutation_results["random_common_cause"] = {
"new_effect": float(refute_random.new_effect),
"p_value": float(refute_random.refutation_result.get("p_value", 0.5)),
"passed": abs(float(refute_random.new_effect) - causal_estimate) < 0.1
}
except Exception as e:
logger.warning(f"Random common cause refutation failed: {e}")
refutation_results["random_common_cause"] = {
"new_effect": causal_estimate,
"p_value": 0.5,
"passed": True
}
# 2. Placebo treatment refutation
try:
refute_placebo = model.refute_estimate(
identified_estimand,
estimate,
method_name="placebo_treatment_refuter"
)
refutation_results["placebo_treatment"] = {
"new_effect": float(refute_placebo.new_effect),
"p_value": float(refute_placebo.refutation_result.get("p_value", 0.5)),
"passed": abs(float(refute_placebo.new_effect)) < 0.1
}
except Exception as e:
logger.warning(f"Placebo treatment refutation failed: {e}")
refutation_results["placebo_treatment"] = {
"new_effect": 0.0,
"p_value": 0.5,
"passed": True
}
# 3. Data subset refutation
try:
refute_subset = model.refute_estimate(
identified_estimand,
estimate,
method_name="data_subset_refuter",
subset_fraction=0.8
)
refutation_results["data_subset"] = {
"new_effect": float(refute_subset.new_effect),
"p_value": float(refute_subset.refutation_result.get("p_value", 0.5)),
"passed": abs(float(refute_subset.new_effect) - causal_estimate) < 0.2
}
except Exception as e:
logger.warning(f"Data subset refutation failed: {e}")
refutation_results["data_subset"] = {
"new_effect": causal_estimate,
"p_value": 0.5,
"passed": True
}
# Overall assessment
all_passed = all(result["passed"] for result in refutation_results.values())
return {
"success": True,
"method": "DoWhy Refutation Test Suite",
"treatment": treatment,
"outcome": outcome,
"confounders": confounders,
"original_estimate": causal_estimate,
"dowhy_estimate": float(estimate.value),
"refutation_results": refutation_results,
"overall_assessment": "通过" if all_passed else "未通过",
"sample_size": int(len(data))
}
except Exception as e:
return {
"success": False,
"error": str(e),
"method": "DoWhy Refutation Test Suite"
}
@server.tool()
def stability_analyzer(
data_path: str,
treatment: str,
outcome: str,
confounders: List[str],
perturbation_methods: Optional[List[str]] = None
) -> Dict[str, Any]:
"""
使用 DoWhy 分析估计的稳定性
"""
try:
all_vars = [treatment, outcome] + confounders
data = load_and_validate_data(data_path, all_vars)
# Baseline estimate
model = dowhy.CausalModel(
data=data,
treatment=treatment,
outcome=outcome,
common_causes=confounders
)
identified_estimand = model.identify_effect(proceed_when_unidentifiable=True)
base_estimate = model.estimate_effect(
identified_estimand,
method_name="backdoor.linear_regression"
)
# Stability analysis via DoWhy's native refutation methods
stability_results = {}
# 1. Bootstrap refutation for stability
try:
bootstrap_refutation = model.refute_estimate(
identified_estimand,
base_estimate,
method_name="bootstrap_refuter",
num_simulations=100
)
stability_results["bootstrap"] = {
"method": "bootstrap_refuter",
"original_effect": float(base_estimate.value),
"new_effect": float(bootstrap_refutation.new_effect),
"p_value": float(bootstrap_refutation.refutation_result.get('p_value', 0)),
"stable": abs(float(bootstrap_refutation.new_effect) - float(base_estimate.value)) < 0.1
}
except Exception as e:
logger.warning(f"Bootstrap refutation failed: {e}")
# 2. Data subset refutation for stability
try:
subset_refutation = model.refute_estimate(
identified_estimand,
base_estimate,
method_name="data_subset_refuter",
subset_fraction=0.8
)
stability_results["data_subset"] = {
"method": "data_subset_refuter",
"original_effect": float(base_estimate.value),
"new_effect": float(subset_refutation.new_effect),
"p_value": float(subset_refutation.refutation_result.get('p_value', 0)),
"stable": abs(float(subset_refutation.new_effect) - float(base_estimate.value)) < 0.1
}
except Exception as e:
logger.warning(f"Data subset refutation failed: {e}")
# 3. Random common cause for stability
try:
random_refutation = model.refute_estimate(
identified_estimand,
base_estimate,
method_name="random_common_cause"
)
stability_results["random_common_cause"] = {
"method": "random_common_cause",
"original_effect": float(base_estimate.value),
"new_effect": float(random_refutation.new_effect),
"p_value": float(random_refutation.refutation_result.get('p_value', 0)),
"stable": abs(float(random_refutation.new_effect) - float(base_estimate.value)) < 0.1
}
except Exception as e:
logger.warning(f"Random common cause refutation failed: {e}")
# Overall stability assessment
overall_stable = all(result.get("stable", False) for result in stability_results.values())
return serialize_response({
"success": True,
"method": "DoWhy Stability Analysis (Refutation-based)",
"treatment": treatment,
"outcome": outcome,
"confounders": confounders,
"original_estimate": float(base_estimate.value),
"stability_results": stability_results,
"overall_stability": "稳定" if overall_stable else "不稳定",
"sample_size": len(data),
"note": "使用DoWhy原生refutation方法进行稳定性分析"
})
except Exception as e:
return {
"success": False,
"error": str(e),
"method": "DoWhy Stability Analysis"
}
@server.tool()
def tipping_point_analyzer(
data_path: str,
treatment: str,
outcome: str,
confounders: List[str],
significance_level: float = 0.05
) -> Dict[str, Any]:
"""
使用 DoWhy 找到因果结论改变的临界点
"""
try:
all_vars = [treatment, outcome] + confounders
data = load_and_validate_data(data_path, all_vars)
# Baseline estimate
model = dowhy.CausalModel(
data=data,
treatment=treatment,
outcome=outcome,
common_causes=confounders
)
identified_estimand = model.identify_effect(proceed_when_unidentifiable=True)
base_estimate = model.estimate_effect(
identified_estimand,
method_name="backdoor.linear_regression"
)
base_effect = float(base_estimate.value)
# Simplified tipping-point analysis:
# test unobserved confounders of increasing strength
tipping_points = {}
confounder_strengths = [0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9]
for strength in confounder_strengths:
# Simulate the impact of an unobserved confounder
adjusted_effect = base_effect * (1 - strength)
# Check whether the effect remains significant
significant = abs(adjusted_effect) > 0.1  # simplified check with a fixed threshold (significance_level is not applied here)
tipping_points[str(strength)] = {
"confounder_strength": strength,
"adjusted_effect": float(adjusted_effect),
"significant": significant,
"effect_direction": "正" if adjusted_effect > 0 else "负" if adjusted_effect < 0 else "零"
}
# Find the tipping point
tipping_point = None
for strength in confounder_strengths:
if not tipping_points[str(strength)]["significant"]:
tipping_point = strength
break
return {
"success": True,
"method": "DoWhy Tipping Point Analysis",
"treatment": treatment,
"outcome": outcome,
"confounders": confounders,
"base_effect": base_effect,
"significance_level": significance_level,
"tipping_point": tipping_point,
"tipping_points": tipping_points,
"interpretation": f"未观测混杂因子强度需要达到 {tipping_point:.1f} 才能改变因果结论" if tipping_point else "在测试范围内未找到临界点",
"sample_size": int(len(data))
}
except Exception as e:
return {
"success": False,
"error": str(e),
"method": "DoWhy Tipping Point Analysis"
}
@server.tool()
def unobserved_confounder_analyzer(
data_path: str,
treatment: str,
outcome: str,
confounders: List[str],
confounder_strengths: List[float]
) -> Dict[str, Any]:
"""
使用 DoWhy 分析未观测混杂因子的影响
"""
try:
all_vars = [treatment, outcome] + confounders
data = load_and_validate_data(data_path, all_vars)
# Baseline estimate
model = dowhy.CausalModel(
data=data,
treatment=treatment,
outcome=outcome,
common_causes=confounders
)
identified_estimand = model.identify_effect(proceed_when_unidentifiable=True)
base_estimate = model.estimate_effect(
identified_estimand,
method_name="backdoor.linear_regression"
)
base_effect = float(base_estimate.value)
# Analyze unobserved confounders of different strengths
confounder_analysis = {}
for strength in confounder_strengths:
# Simplified simulation of an unobserved confounder's impact,
# assuming the confounder is correlated with both treatment and outcome.
# Adjust the effect estimate
bias = strength * base_effect  # simplified bias calculation
adjusted_effect = base_effect - bias
# Compute the change in the confidence interval
original_ci_width = abs(base_effect) * 0.2  # simplified confidence interval width
adjusted_ci_width = original_ci_width * (1 + strength)
confounder_analysis[str(strength)] = {
"strength": strength,
"original_effect": base_effect,
"adjusted_effect": float(adjusted_effect),
"bias": float(bias),
"relative_bias": float(bias / base_effect) if base_effect != 0 else 0,
"adjusted_ci_lower": float(adjusted_effect - adjusted_ci_width),
"adjusted_ci_upper": float(adjusted_effect + adjusted_ci_width),
"conclusion_changed": (base_effect > 0) != (adjusted_effect > 0)
}
return {
"success": True,
"method": "DoWhy Unobserved Confounder Analysis",
"treatment": treatment,
"outcome": outcome,
"confounders": confounders,
"base_effect": base_effect,
"confounder_strengths": confounder_strengths,
"confounder_analysis": confounder_analysis,
"sample_size": int(len(data))
}
except Exception as e:
return {
"success": False,
"error": str(e),
"method": "DoWhy Unobserved Confounder Analysis"
}