get_clinical_data

Retrieve patient clinical data from cancer studies with pagination support, enabling researchers to access specific attributes or comprehensive datasets for analysis.

Instructions

Get clinical data for patients in a study with pagination support. Can fetch specific attributes or all.

Input Schema

Table | JSON Schema

Name	Required	Default
`study_id`	Yes
`attribute_ids`	No
`page_number`	No	0
`page_size`	No	50
`sort_by`	No
`direction`	No	ASC
`limit`	No

Implementation Reference

cbioportal_mcp/server.py:97-131 (registration)

Registers 'get_clinical_data' (line 119) and the other listed methods as MCP tools by adding each one to the FastMCP instance.

"""Register tool methods as MCP tools."""
# Explicit allow-list of method names to expose as MCP tools; the loop below
# registers only the names that appear here.
tool_methods = [
    # Pagination helpers
    "paginate_results",
    "collect_all_results",
    # Study-related tools
    "get_cancer_studies",
    "get_cancer_types",
    "search_studies",
    "get_study_details",
    "get_multiple_studies",
    # Gene-related tools
    "search_genes",
    "get_genes",
    "get_multiple_genes",
    "get_mutations_in_gene",
    # Sample-related tools
    "get_samples_in_study",
    "get_sample_list_id",
    # Molecular profile, clinical data and gene panel tools
    "get_molecular_profiles",
    "get_clinical_data",
    "get_gene_panels_for_study",
    "get_gene_panel_details",
]

for method_name in tool_methods:
    # Guard first: a listed name with no matching attribute on this object is
    # reported and skipped instead of aborting the whole registration pass.
    if not hasattr(self, method_name):
        logger.warning(f"Method {method_name} not found for tool registration")
        continue
    self.mcp.add_tool(getattr(self, method_name))
    logger.debug(f"Registered tool: {method_name}")

cbioportal_mcp/server.py:308-321 (handler)

MCP-exposed handler for get_clinical_data tool. Delegates execution to the molecular_profiles endpoint implementation.

async def get_clinical_data(
    self,
    study_id: str,
    attribute_ids: Optional[List[str]] = None,
    page_number: int = 0,
    page_size: int = 50,
    sort_by: Optional[str] = None,
    direction: str = "ASC",
    limit: Optional[int] = None,
) -> Dict:
    """Get clinical data for patients in a study with pagination support. Can fetch specific attributes or all."""
    # Thin pass-through: all work happens in the molecular_profiles endpoint
    # object. Arguments are forwarded by name so each value is visibly bound
    # to the parameter it is meant for.
    result = await self.molecular_profiles.get_clinical_data(
        study_id=study_id,
        attribute_ids=attribute_ids,
        page_number=page_number,
        page_size=page_size,
        sort_by=sort_by,
        direction=direction,
        limit=limit,
    )
    return result

cbioportal_mcp/endpoints/molecular_profiles.py:83-179 (handler)

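Primary implementation of get_clinical_data: builds the request parameters, calls the cBioPortal API (GET for all attributes, POST when specific attribute IDs are given), checks that the response is a list, groups the raw clinical data into a nested patient-attribute structure, and applies pagination and limits.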

@handle_api_errors("get clinical data")
async def get_clinical_data(
    self,
    study_id: str,
    attribute_ids: Optional[List[str]] = None,
    page_number: int = 0,
    page_size: int = 50,
    sort_by: Optional[str] = None,
    direction: str = "ASC",
    limit: Optional[int] = None,
) -> Dict:
    """
    Get clinical data for patients in a study with pagination support. Can fetch specific attributes or all.

    Args:
        study_id: Study identifier interpolated into the endpoint path.
        attribute_ids: When non-empty, only these attributes are requested
            (POST to the ``/fetch`` endpoint); otherwise every attribute is
            requested (GET).
        page_number: Sent to the API as ``pageNumber``.
        page_size: Sent to the API as ``pageSize`` unless ``limit == 0``.
        sort_by: Sent as ``sortBy`` only when truthy.
        direction: Sent to the API as ``direction``.
        limit: ``0`` swaps the page size for ``FETCH_ALL_PAGE_SIZE``; a
            positive value truncates the raw API rows (not patients) to at
            most that many before grouping.

    Returns:
        On success, a dict with ``clinical_data_by_patient`` (patient id ->
        {attribute id -> value}) and a ``pagination`` summary. On any
        failure, a dict with an ``error`` key; exceptions are not propagated.
    """
    try:
        # Key order mirrors the request contract; "sortBy" is appended last
        # and only when a sort field was supplied.
        api_call_params = {
            "pageNumber": page_number,
            "pageSize": FETCH_ALL_PAGE_SIZE if limit == 0 else page_size,
            "direction": direction,
            "clinicalDataType": "PATIENT",  # patient-level data is assumed
        }
        if sort_by:
            api_call_params["sortBy"] = sort_by

        # Specific attributes go through the POST "fetch" endpoint with a JSON
        # body; an unfiltered request is a plain GET.
        if attribute_ids:
            endpoint = f"studies/{study_id}/clinical-data/fetch"
            request_kwargs = {
                "method": "POST",
                "params": api_call_params,
                "json_data": {
                    "attributeIds": attribute_ids,
                    "clinicalDataType": "PATIENT",
                },
            }
        else:
            endpoint = f"studies/{study_id}/clinical-data"
            request_kwargs = {"method": "GET", "params": api_call_params}

        response = await self.api_client.make_api_request(endpoint, **request_kwargs)

        # Anything other than a list is reported back as an error payload; a
        # dict carrying "api_error" gets the more specific message.
        if not isinstance(response, list):
            if isinstance(response, dict) and "api_error" in response:
                message = "API error fetching clinical data"
            else:
                message = (
                    "Unexpected API response type for clinical data (expected list)"
                )
            return {
                "error": message,
                "details": response,
                "request_params": api_call_params,
            }

        # A completely full page is the only hint that further pages may
        # exist. A short page compares unequal here, so the fetch-all case
        # needs no separate handling.
        has_more = len(response) == api_call_params["pageSize"]

        # A positive limit caps the number of raw rows that get grouped.
        rows = response
        if limit and limit > 0 and len(response) > limit:
            rows = response[:limit]

        # Group attribute values under their patient; rows without a patient
        # id are skipped.
        by_patient = {}
        for row in rows:
            pid = row.get("patientId")
            if not pid:
                continue
            by_patient.setdefault(pid, {})[row.get("clinicalAttributeId")] = row.get(
                "value"
            )

        return {
            "clinical_data_by_patient": by_patient,
            "pagination": {
                "page": page_number,
                "page_size": page_size,
                # Counts unique patients in the response, not raw API rows.
                "total_found": len(by_patient),
                "has_more": has_more,
            },
        }
    except Exception as exc:
        return {
            "error": f"Failed to get clinical data for study {study_id}: {exc}"
        }

cBioPortal MCP Server