# -*- coding: utf-8 -*-
"""Location: ./mcpgateway/utils/retry_manager.py
Copyright 2025
SPDX-License-Identifier: Apache-2.0
Authors: Keval Mahajan
MCP Gateway Resilient HTTP Client with Retry Logic.
This module provides a resilient HTTP client that automatically retries requests
in the event of certain errors or status codes. It implements exponential backoff
with jitter for retrying requests, making it suitable for use in environments where
network reliability is a concern or when dealing with rate-limited APIs.
Key Features:
- Automatic retry logic for transient failures
- Exponential backoff with configurable jitter
- Support for HTTP 429 Retry-After headers
- Configurable retry policies and delay parameters
- Async context manager support for resource cleanup
- Standard HTTP methods (GET, POST, PUT, DELETE)
- Comprehensive error classification
The client distinguishes between retryable and non-retryable errors:
Retryable Status Codes:
- 429 (Too Many Requests) - with Retry-After header support
- 503 (Service Unavailable)
- 502 (Bad Gateway)
- 504 (Gateway Timeout)
- 408 (Request Timeout)
Non-Retryable Status Codes:
- 400 (Bad Request)
- 401 (Unauthorized)
- 403 (Forbidden)
- 404 (Not Found)
- 405 (Method Not Allowed)
- 406 (Not Acceptable)
Retryable Network Errors:
- Connection timeouts
- Read timeouts
- Network errors
Dependencies:
- Standard Library: asyncio, logging, random
- Third-party: httpx
- First-party: mcpgateway.config.settings
Example Usage:
Basic usage with default settings:
>>> import asyncio
>>> from mcpgateway.utils.retry_manager import ResilientHttpClient
>>>
>>> # Test client initialization and context manager
>>> async def test_basic_usage():
... async with ResilientHttpClient() as client:
... # Verify client is properly initialized
... assert client.max_retries > 0
... assert client.base_backoff > 0
... assert isinstance(client.client, httpx.AsyncClient)
... return True
>>> # asyncio.run(test_basic_usage()) # Would return True
Custom configuration:
>>> # Test custom configuration
>>> client = ResilientHttpClient(
... max_retries=5,
... base_backoff=2.0,
... max_delay=120.0
... )
>>> client.max_retries
5
>>> client.base_backoff
2.0
>>> client.max_delay
120.0
>>>
>>> # Test client cleanup
>>> async def cleanup_test():
... await client.aclose()
... return True
>>> # asyncio.run(cleanup_test()) # Would properly close the client
Testing retry behavior:
>>> # Test that retryable errors are identified correctly
>>> client = ResilientHttpClient()
>>> client._should_retry(httpx.NetworkError("Network error"), None)
True
>>>
>>> # Test non-retryable status codes
>>> from unittest.mock import Mock
>>> response_404 = Mock()
>>> response_404.status_code = 404
>>> client._should_retry(Exception(), response_404)
False
>>>
>>> # Test retryable status codes
>>> response_503 = Mock()
>>> response_503.status_code = 503
>>> client._should_retry(Exception(), response_503)
True
Testing HTTP methods:
>>> # Verify all HTTP methods are available
>>> client = ResilientHttpClient()
>>> import inspect
>>> all([
... inspect.iscoroutinefunction(client.get),
... inspect.iscoroutinefunction(client.post),
... inspect.iscoroutinefunction(client.put),
... inspect.iscoroutinefunction(client.delete)
... ])
True
Testing backoff calculation:
>>> # Test exponential backoff calculation
>>> client = ResilientHttpClient(base_backoff=1.0, jitter_max=0.5)
>>> # First retry: 1.0 * (2^0) = 1.0 seconds base
>>> # Second retry: 1.0 * (2^1) = 2.0 seconds base
>>> # Third retry: 1.0 * (2^2) = 4.0 seconds base
>>> client.base_backoff * (2**0)
1.0
>>> client.base_backoff * (2**1)
2.0
>>> client.base_backoff * (2**2)
4.0
Testing error classification:
>>> # Verify error code sets
>>> from mcpgateway.utils.retry_manager import RETRYABLE_STATUS_CODES, NON_RETRYABLE_STATUS_CODES
>>> 429 in RETRYABLE_STATUS_CODES
True
>>> 503 in RETRYABLE_STATUS_CODES
True
>>> 400 in NON_RETRYABLE_STATUS_CODES
True
>>> 404 in NON_RETRYABLE_STATUS_CODES
True
>>> # Ensure no overlap between sets
>>> len(RETRYABLE_STATUS_CODES & NON_RETRYABLE_STATUS_CODES)
0
"""
# Standard
import asyncio
from contextlib import asynccontextmanager
import logging
import random
from typing import Any, AsyncContextManager, Dict, Optional
# Third-Party
import httpx
# First-Party
from mcpgateway.config import settings
# Module-level logger (configured by the application's logging setup)
logger = logging.getLogger(__name__)

# HTTP status codes that indicate transient failures worth retrying.
RETRYABLE_STATUS_CODES = {
    408,  # Request Timeout
    429,  # Too Many Requests (honors Retry-After)
    502,  # Bad Gateway
    503,  # Service Unavailable
    504,  # Gateway Timeout
}

# HTTP status codes that indicate permanent client errors; never retried.
NON_RETRYABLE_STATUS_CODES = {
    400,  # Bad Request
    401,  # Unauthorized
    403,  # Forbidden
    404,  # Not Found
    405,  # Method Not Allowed
    406,  # Not Acceptable
}
class ResilientHttpClient:
    """A resilient HTTP client with automatic retry capabilities.

    This client automatically retries requests in the event of certain errors
    or status codes using exponential backoff with jitter. It's designed to
    handle transient network issues and rate limiting gracefully.

    The retry logic implements:
    - Exponential backoff: delay = base_backoff * (2 ** attempt)
    - Jitter: random additional delay to prevent thundering herd
    - Respect for numeric HTTP 429 Retry-After headers (an HTTP-date value
      falls back to exponential backoff rather than failing)
    - Maximum delay caps to prevent excessive waiting

    Attributes:
        max_retries: Maximum number of retry attempts
        base_backoff: Base delay in seconds before first retry
        max_delay: Maximum delay between retries in seconds
        jitter_max: Maximum jitter fraction (0-1) to add randomness
        client_args: Additional arguments for httpx.AsyncClient
        client: The underlying httpx.AsyncClient instance

    Examples:
        >>> # Test initialization with default values
        >>> client = ResilientHttpClient()
        >>> client.max_retries > 0
        True
        >>> isinstance(client.client, httpx.AsyncClient)
        True
        >>> # Test initialization with custom values
        >>> client = ResilientHttpClient(max_retries=5, base_backoff=2.0)
        >>> client.max_retries
        5
        >>> client.base_backoff
        2.0
        >>> # Test client_args parameter (limits added by default)
        >>> client = ResilientHttpClient(client_args={"timeout": 30.0})
        >>> client.client_args["timeout"]
        30.0
        >>> "limits" in client.client_args
        True
    """

    def __init__(
        self,
        max_retries: int = settings.retry_max_attempts,
        base_backoff: float = settings.retry_base_delay,
        max_delay: float = settings.retry_max_delay,
        jitter_max: float = settings.retry_jitter_max,
        client_args: Optional[Dict[str, Any]] = None,
    ):
        """Initialize the ResilientHttpClient with configurable retry behavior.

        Args:
            max_retries: Maximum number of retry attempts before giving up
            base_backoff: Base delay in seconds before retrying a request
            max_delay: Maximum backoff delay in seconds
            jitter_max: Maximum jitter fraction (0-1) to add randomness
            client_args: Additional arguments to pass to httpx.AsyncClient

        Examples:
            >>> client = ResilientHttpClient(max_retries=10, base_backoff=5.0)
            >>> client.max_retries
            10
            >>> client.base_backoff
            5.0
            >>> # Default connection limits are injected when not provided
            >>> "limits" in ResilientHttpClient(client_args=None).client_args
            True
        """
        self.max_retries = max_retries
        self.base_backoff = base_backoff
        self.max_delay = max_delay
        self.jitter_max = jitter_max
        self.client_args = client_args or {}
        # Add default httpx.Limits if not provided for connection pooling
        if "limits" not in self.client_args:
            self.client_args["limits"] = httpx.Limits(
                max_connections=settings.httpx_max_connections,
                max_keepalive_connections=settings.httpx_max_keepalive_connections,
                keepalive_expiry=settings.httpx_keepalive_expiry,
            )
        self.client = httpx.AsyncClient(**self.client_args)

    async def _sleep_with_jitter(self, base: float, jitter_range: float):
        """Sleep for a period with added jitter to prevent thundering herd.

        The total delay (base + random jitter) is capped at ``max_delay``.

        Args:
            base: Base sleep time in seconds
            jitter_range: Maximum additional random delay in seconds
        """
        # random.uniform() is safe here as jitter is only used for retry timing, not security
        delay = base + random.uniform(0, jitter_range)  # nosec B311 # noqa: DUO102
        # Ensure delay doesn't exceed the max allowed
        delay = min(delay, self.max_delay)
        await asyncio.sleep(delay)

    def _should_retry(self, exc: Optional[Exception], response: Optional[httpx.Response]) -> bool:
        """Determine whether a request should be retried.

        Evaluates the exception and response to decide if the request should
        be retried based on error type and HTTP status code. Status codes not
        listed in either set are treated as non-retryable.

        Args:
            exc: Exception raised during the request, or None if a response
                was received
            response: HTTP response object if available

        Returns:
            True if the request should be retried, False otherwise

        Examples:
            >>> client = ResilientHttpClient()
            >>> client._should_retry(httpx.ConnectTimeout("Connection timeout"), None)
            True
            >>> client._should_retry(httpx.NetworkError("Network error"), None)
            True
            >>> from unittest.mock import Mock
            >>> response_400 = Mock()
            >>> response_400.status_code = 400
            >>> client._should_retry(None, response_400)
            False
            >>> response_429 = Mock()
            >>> response_429.status_code = 429
            >>> client._should_retry(None, response_429)
            True
            >>> # Unknown status codes are not retried
            >>> response_418 = Mock()
            >>> response_418.status_code = 418
            >>> client._should_retry(None, response_418)
            False
        """
        if isinstance(exc, (httpx.ConnectTimeout, httpx.ReadTimeout, httpx.NetworkError)):
            return True
        if response:
            if response.status_code in NON_RETRYABLE_STATUS_CODES:
                logger.info(f"Response {response.status_code}: Not retrying.")
                return False
            if response.status_code in RETRYABLE_STATUS_CODES:
                logger.info(f"Response {response.status_code}: Retrying.")
                return True
        return False

    async def request(self, method: str, url: str, **kwargs) -> httpx.Response:
        """Make a resilient HTTP request with automatic retries.

        Performs an HTTP request with automatic retry logic for transient
        failures. Implements exponential backoff with jitter and respects
        numeric HTTP 429 Retry-After headers; a non-numeric (HTTP-date)
        Retry-After falls back to exponential backoff.

        Args:
            method: HTTP method (GET, POST, PUT, DELETE, etc.)
            url: Target URL for the request
            **kwargs: Additional parameters to pass to httpx.request

        Returns:
            HTTP response object from the last request (successful, or the
            final retryable-error response if all attempts are exhausted)

        Raises:
            Exception: The last network-level exception encountered if all
                retries fail, or immediately for non-retryable errors
        """
        attempt = 0
        last_exc: Optional[Exception] = None
        response: Optional[httpx.Response] = None
        while attempt < self.max_retries:
            try:
                logger.debug(f"Attempt {attempt + 1} to {method} {url}")
                response = await self.client.request(method, url, **kwargs)
                if response.status_code in NON_RETRYABLE_STATUS_CODES or response.is_success:
                    return response
                # Handle 429 - honor an explicit numeric Retry-After header
                if response.status_code == 429:
                    retry_after = response.headers.get("Retry-After")
                    if retry_after:
                        try:
                            retry_after_sec = float(retry_after)
                        except ValueError:
                            # Retry-After may be an HTTP-date (RFC 9110);
                            # fall back to exponential backoff below.
                            retry_after_sec = None
                        if retry_after_sec is not None:
                            logger.info(f"Rate-limited. Retrying after {retry_after_sec}s.")
                            await asyncio.sleep(retry_after_sec)
                            attempt += 1
                            continue
                if not self._should_retry(None, response):
                    return response
            except Exception as exc:
                if not self._should_retry(exc, None):
                    raise
                last_exc = exc
                logger.warning(f"Retrying due to error: {exc}")
            # Exponential backoff with proportional jitter
            delay = self.base_backoff * (2**attempt)
            jitter = delay * self.jitter_max
            await self._sleep_with_jitter(delay, jitter)
            attempt += 1
            logger.debug(f"Retry scheduled after delay of {delay:.2f} seconds.")
        if last_exc:
            raise last_exc
        logger.error(f"Max retries reached for {url}")
        return response

    async def get(self, url: str, **kwargs):
        """Make a resilient GET request.

        Args:
            url: URL to send the GET request to
            **kwargs: Additional parameters to pass to the request

        Returns:
            HTTP response object from the GET request
        """
        return await self.request("GET", url, **kwargs)

    async def post(self, url: str, **kwargs):
        """Make a resilient POST request.

        Args:
            url: URL to send the POST request to
            **kwargs: Additional parameters to pass to the request

        Returns:
            HTTP response object from the POST request
        """
        return await self.request("POST", url, **kwargs)

    async def put(self, url: str, **kwargs):
        """Make a resilient PUT request.

        Args:
            url: URL to send the PUT request to
            **kwargs: Additional parameters to pass to the request

        Returns:
            HTTP response object from the PUT request
        """
        return await self.request("PUT", url, **kwargs)

    async def delete(self, url: str, **kwargs):
        """Make a resilient DELETE request.

        Args:
            url: URL to send the DELETE request to
            **kwargs: Additional parameters to pass to the request

        Returns:
            HTTP response object from the DELETE request
        """
        return await self.request("DELETE", url, **kwargs)

    @asynccontextmanager
    async def stream(self, method: str, url: str, **kwargs) -> AsyncContextManager[httpx.Response]:
        """Open a resilient streaming HTTP request.

        Retries opening the stream on transient failures using the same
        backoff policy as :meth:`request`.

        Args:
            method: HTTP method to use (e.g. "GET", "POST")
            url: URL to send the request to
            **kwargs: Additional parameters to pass to the request

        Yields:
            HTTP response object with streaming capability

        Raises:
            Exception: If a non-retryable error occurs while opening the stream
            RuntimeError: If the maximum number of retries is exceeded (chained
                to the last underlying exception, if any)

        Examples:
            >>> client = ResilientHttpClient()
            >>> import contextlib
            >>> isinstance(client.stream("GET", "https://example.com"), contextlib.AbstractAsyncContextManager)
            True
        """
        attempt = 0
        last_exc: Optional[Exception] = None
        while attempt < self.max_retries:
            try:
                logger.debug("Attempt %d (stream) %s %s", attempt + 1, method, url)
                stream_cm = self.client.stream(method, url, **kwargs)
                async with stream_cm as resp:
                    if not resp.is_success:
                        if resp.status_code == 429:
                            ra = resp.headers.get("Retry-After")
                            if ra:
                                try:
                                    wait = float(ra)
                                except ValueError:
                                    # HTTP-date form: fall through to backoff
                                    wait = None
                                # `is not None` so an explicit "Retry-After: 0" is honored
                                if wait is not None:
                                    logger.info("Rate-limited. Sleeping Retry-After=%s", wait)
                                    await asyncio.sleep(wait)
                                    attempt += 1
                                    continue
                        if not self._should_retry(None, resp):
                            # give caller the error response once and return
                            yield resp
                            return
                        logger.info("Stream response %s considered retryable; will retry opening.", resp.status_code)
                    else:
                        # good response -> yield it to caller
                        yield resp
                        return
            except Exception as exc:
                last_exc = exc
                if not self._should_retry(exc, None):
                    raise
                logger.warning("Error opening stream (will retry): %s", exc)
            # Exponential backoff with proportional jitter
            backoff = self.base_backoff * (2**attempt)
            jitter_range = backoff * self.jitter_max
            await self._sleep_with_jitter(backoff, jitter_range)
            attempt += 1
            logger.debug("Retrying stream open (attempt %d) after backoff %.2f", attempt + 1, backoff)
        if last_exc:
            # Chain the original exception so the caller keeps the traceback
            raise RuntimeError(last_exc) from last_exc
        raise RuntimeError("Max retries reached opening stream")

    async def aclose(self):
        """Close the underlying HTTP client gracefully.

        Ensures proper cleanup of the httpx.AsyncClient and its resources.
        """
        await self.client.aclose()

    async def __aenter__(self):
        """Asynchronous context manager entry point.

        Returns:
            The client instance for use in async with statements
        """
        return self

    async def __aexit__(self, *args):
        """Asynchronous context manager exit point.

        Ensures the HTTP client is properly closed after use, even if
        exceptions occur during the context manager block.

        Args:
            *args: Exception information passed by the context manager
                (exc_type, exc_value, traceback) or None values if no exception
        """
        await self.aclose()