OrigeneMCP

OrigeneMCP
tools
clinicaltrials

clinicaltrials_api.py•9.78 kB

import requests import json from typing import Optional, Dict, List, Any, Union class ClinicalTrialsAPI: BASE_URL = "https://clinicaltrials.gov/api/v2/" def __init__(self): self.session = requests.Session() self.headers = { "accept": "application/json" } def _flatten_params(self, prefix: str, data: Optional[Dict[str, Any]]) -> Dict[str, Any]: if not data: return {} return {f"{prefix}.{k}": v for k, v in data.items()} def _get(self, endpoint: str, params: Optional[Dict[str, Any]] = None) -> Optional[Dict[str, Any]]: """Internal helper for GET requests.""" url = self.BASE_URL + endpoint try: r = requests.get(url, params=params, headers=self.headers) r.raise_for_status() return r.json() except requests.exceptions.HTTPError as err: print(f"HTTP error occurred: {err}") try: content_type = r.headers.get("Content-Type", "") if "application/json" in content_type: error_detail = r.json() print("Error details (JSON):") print(json.dumps(error_detail, indent=2)) else: print("Error details (text):") print(r.text) except Exception as e: print(f"Failed to parse error response: {e}") return None except Exception as err: print(f"Other error occurred: {err}") return None def get_studies( self, query: Optional[Dict[str, Any]] = None, filter: Optional[Dict[str, Any]] = None, post_filter: Optional[Dict[str, Any]] = None, fields: Optional[List[str]] = None, sort: Optional[List[str]] = None, page_size: int = 50, page_token: Optional[str] = None, format: str = "json", markup_format: str = "markdown", count_total: bool = False ) -> Dict[str, Any]: """ Query the /studies endpoint with support for structured query, filter, and postFilter parameters. Parameters: query (dict): Parameters for query.* fields (e.g., {"cond": "glioblastoma"}). filter (dict): Parameters for filter.* fields (e.g., {"overallStatus": "RECRUITING"}). post_filter (dict): Parameters for postFilter.* fields. fields (list of str): List of fields to return (e.g., ["NCTId", "BriefTitle"]). sort (list of str): Sort fields (e.g., ["@relevance", "EnrollmentCount:desc"]). page_size (int): Number of results per page (maximum 1000). page_token (str): Token for retrieving the next page. format (str): Response format, either "json" or "csv". markup_format (str): Markup formatting for text fields, either "markdown" or "legacy". count_total (bool): Whether to include the total number of studies. Returns: dict: A response object containing the list of studies, nextPageToken, and optional metadata. """ params = { "format": format, "markupFormat": markup_format, "pageSize": str(page_size), "countTotal": str(count_total).lower() } if page_token: params["pageToken"] = page_token if fields: params["fields"] = ",".join(fields) if sort: params["sort"] = ",".join(sort) # 合并嵌套参数组 params.update(self._flatten_params("query", query)) params.update(self._flatten_params("filter", filter)) params.update(self._flatten_params("postFilter", post_filter)) endpoint = "studies" response = self._get(endpoint, params=params) return response def get_study( self, nct_id: str, format: str = "json", markup_format: str = "markdown", fields: Optional[List[str]] = None ) -> Union[Dict[str, Any], bytes, None]: """ Retrieve details for a single clinical trial using its NCT ID. Args: nct_id (str): The NCT number of the study (e.g., "NCT04000165"). format (str): Response format. One of 'json', 'csv', 'json.zip', 'fhir.json', 'ris'. Default is 'json'. markup_format (str): Markup formatting for text fields. Only applicable when format is 'json' or 'json.zip'. Options are 'markdown' (default) or 'legacy'. fields (List[str], optional): List of fields to include in the response. Ignored if format is 'fhir.json'. Returns: dict: If format is 'json', returns a parsed JSON dictionary. bytes: For other formats (CSV, RIS, FHIR, ZIP), returns raw bytes content. None: If the request fails or an error occurs. """ params = {"format": format} if format in {"json", "json.zip"}: params["markupFormat"] = markup_format if fields and format != "fhir.json": params["fields"] = ",".join(fields) endpoint = f"studies/{nct_id}" response = self._get(endpoint, params=params) return response def get_metadata( self, include_indexed_only: bool = False, include_historic_only: bool = False ) -> Optional[Dict[str, Any]]: """ Retrieve the list of study data model fields. Args: include_indexed_only (bool): If True, include fields that are indexed only. include_historic_only (bool): If True, include fields available only in historic datasets. Returns: dict: Metadata describing all available fields in the study data model. """ params = { "includeIndexedOnly": str(include_indexed_only).lower(), "includeHistoricOnly": str(include_historic_only).lower() } endpoint = "studies/metadata" return self._get(endpoint, params=params) def get_search_areas(self) -> Optional[Dict[str, Any]]: """ Retrieve all available search documents and their search areas. Returns: dict: A dictionary describing all searchable documents and their corresponding areas. """ endpoint = "studies/search-areas" return self._get(endpoint) def get_enums(self) -> Optional[Dict[str, Any]]: """ Retrieve all enumeration types and their corresponding values. Returns: dict: A dictionary containing enum type names, the pieces using them, and all possible values including legacy mappings. """ endpoint = "studies/enums" return self._get(endpoint) def get_study_size_stats(self) -> Optional[Dict[str, Any]]: """ Retrieve statistics about the size of study records in JSON format. Returns: dict: Contains statistical information such as average, min, max, and total JSON size for all studies. """ endpoint = "stats/size" return self._get(endpoint) def get_field_value_stats( self, fields: List[str], types: Optional[List[str]] = None ) -> Optional[Dict[str, Any]]: """ Retrieve value statistics for one or more leaf-level fields. Args: fields (List[str]): List of field names or paths (e.g., ["Phase", "Condition"]). types (List[str], optional): Filter by data types. Options: ENUM, STRING, DATE, INTEGER, NUMBER, BOOLEAN. Returns: dict: A dictionary containing value distributions for each requested field. """ if not fields: raise ValueError("At least one field must be specified.") params = { "fields": ",".join(fields) } if types: params["types"] = ",".join(types) endpoint = "stats/field/values" return self._get(endpoint, params=params) def get_field_size_stats( self, fields: Optional[List[str]] = None ) -> Optional[Dict[str, Any]]: """ Retrieve size statistics for list/array fields. Args: fields (List[str], optional): List of field names or paths to filter on. If None, stats for all list fields will be returned. Returns: dict: A dictionary containing list size distributions for each specified field. """ params = {} if fields: params["fields"] = ",".join(fields) endpoint = "stats/field/sizes" return self._get(endpoint, params=params) if __name__ == "__main__": api = ClinicalTrialsAPI() result = api.get_studies( query={"cond": "lung cancer", "term": "AREA[StartDate]RANGE[2020,MAX]"}, filter={"overallStatus": "RECRUITING"}, fields=["NCTId", "BriefTitle", "OverallStatus"], sort=["@relevance"], page_size=30, count_total=True ) print(result) res = api.get_study("NCT04000165", fields=["NCTId", "BriefTitle"]) print(res) res = api.get_metadata() print(res) search_areas = api.get_search_areas() print(search_areas) stats = api.get_field_value_stats( fields=["Phase", "Condition"], types=["ENUM", "STRING"] )

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/GENTEL-lab/OrigeneMCP'

If you have feedback or need assistance with the MCP directory API, please join our Discord server