Polymarket MCP Server

rate_limiter.py•9.08 KiB

"""
Rate limiter implementation using token bucket algorithm.

Respects Polymarket's API rate limits across different endpoint categories.
"""

import asyncio
import logging
import time
from collections import defaultdict
from dataclasses import dataclass
from enum import Enum
from typing import Any, Dict, Optional

logger = logging.getLogger(__name__)

# Bounds (in seconds) for the exponential backoff applied after HTTP 429s.
_INITIAL_BACKOFF_SECONDS = 1.0
_MAX_BACKOFF_SECONDS = 60.0

# Lower bound on a single sleep inside TokenBucket.acquire, to avoid spinning.
_MIN_SLEEP_SECONDS = 0.01


class EndpointCategory(Enum):
    """Polymarket API endpoint categories with different rate limits"""

    CLOB_GENERAL = "clob_general"  # 5000/10s
    MARKET_DATA = "market_data"  # 200/10s (/book, /price)
    BATCH_OPS = "batch_ops"  # 80/10s
    TRADING_BURST = "trading_burst"  # 2400/10s
    TRADING_SUSTAINED = "trading_sustained"  # 24000/10min
    GAMMA_API = "gamma_api"  # 750/10s
    DATA_API = "data_api"  # 200/10s


@dataclass
class RateLimitConfig:
    """Configuration for a rate limit bucket"""

    max_tokens: int  # Maximum tokens in bucket
    refill_rate: float  # Tokens per second
    window_seconds: float  # Time window for rate limit


# Rate limit configurations for each endpoint category
RATE_LIMITS: Dict[EndpointCategory, RateLimitConfig] = {
    EndpointCategory.CLOB_GENERAL: RateLimitConfig(
        max_tokens=5000,
        refill_rate=500.0,  # 5000/10s
        window_seconds=10.0,
    ),
    EndpointCategory.MARKET_DATA: RateLimitConfig(
        max_tokens=200,
        refill_rate=20.0,  # 200/10s
        window_seconds=10.0,
    ),
    EndpointCategory.BATCH_OPS: RateLimitConfig(
        max_tokens=80,
        refill_rate=8.0,  # 80/10s
        window_seconds=10.0,
    ),
    EndpointCategory.TRADING_BURST: RateLimitConfig(
        max_tokens=2400,
        refill_rate=240.0,  # 2400/10s
        window_seconds=10.0,
    ),
    EndpointCategory.TRADING_SUSTAINED: RateLimitConfig(
        max_tokens=24000,
        refill_rate=40.0,  # 24000/10min = 40/s
        window_seconds=600.0,
    ),
    EndpointCategory.GAMMA_API: RateLimitConfig(
        max_tokens=750,
        refill_rate=75.0,  # 750/10s
        window_seconds=10.0,
    ),
    EndpointCategory.DATA_API: RateLimitConfig(
        max_tokens=200,
        refill_rate=20.0,  # 200/10s
        window_seconds=10.0,
    ),
}


class TokenBucket:
    """
    Token bucket implementation for rate limiting.

    The bucket starts full and tokens are consumed on each request.
    Tokens refill at a constant rate over time, capped at ``max_tokens``.
    """

    def __init__(self, config: RateLimitConfig):
        self.max_tokens = config.max_tokens
        self.refill_rate = config.refill_rate
        self.tokens = float(config.max_tokens)
        self.last_refill = time.monotonic()
        self._lock = asyncio.Lock()

    def _refill(self) -> None:
        """Refill tokens based on elapsed time"""
        now = time.monotonic()
        elapsed = now - self.last_refill

        # Add tokens based on elapsed time, never exceeding bucket capacity
        new_tokens = elapsed * self.refill_rate
        self.tokens = min(self.max_tokens, self.tokens + new_tokens)
        self.last_refill = now

    async def acquire(self, tokens: int = 1) -> float:
        """
        Acquire tokens from the bucket. Blocks if insufficient tokens available.

        Args:
            tokens: Number of tokens to acquire

        Returns:
            float: Time waited in seconds (sum of the requested sleep durations)

        Raises:
            ValueError: If ``tokens`` is negative or larger than the bucket
                capacity. The bucket never holds more than ``max_tokens``, so
                such a request could never be satisfied and would otherwise
                wait forever while holding the bucket lock.
        """
        if tokens < 0:
            raise ValueError(f"Cannot acquire a negative number of tokens: {tokens}")
        if tokens > self.max_tokens:
            raise ValueError(
                f"Cannot acquire {tokens} tokens: bucket capacity is {self.max_tokens}"
            )

        # The lock is intentionally held while sleeping so that waiters are
        # served one at a time instead of racing for freshly refilled tokens.
        async with self._lock:
            wait_time = 0.0

            while True:
                self._refill()

                if self.tokens >= tokens:
                    self.tokens -= tokens
                    # Lazy %-formatting: no string is built unless DEBUG is on.
                    logger.debug(
                        "Acquired %s tokens. Remaining: %.2f/%s",
                        tokens,
                        self.tokens,
                        self.max_tokens,
                    )
                    return wait_time

                # Calculate wait time for sufficient tokens
                tokens_needed = tokens - self.tokens
                sleep_time = tokens_needed / self.refill_rate

                # Add small buffer to avoid tight loops
                sleep_time = max(sleep_time, _MIN_SLEEP_SECONDS)

                logger.debug(
                    "Insufficient tokens (%.2f/%s). Waiting %.2fs",
                    self.tokens,
                    tokens,
                    sleep_time,
                )

                await asyncio.sleep(sleep_time)
                wait_time += sleep_time

    def available_tokens(self) -> int:
        """Get current number of available tokens"""
        self._refill()
        return int(self.tokens)


class RateLimiter:
    """
    Rate limiter managing multiple token buckets for different endpoint categories.

    Features:
    - Separate buckets per endpoint category
    - Automatic queuing when limit reached
    - Exponential backoff on 429 errors
    - Safe for concurrent use by coroutines (built on ``asyncio.Lock``, which
      is not thread-safe)
    """

    def __init__(self):
        self.buckets: Dict[EndpointCategory, TokenBucket] = {}
        # Monotonic-clock deadline until which each category is backing off.
        self._429_backoff: Dict[EndpointCategory, float] = defaultdict(float)
        # Length of the most recent backoff per category; this (not the time
        # remaining) is what gets doubled on consecutive 429s.
        self._429_backoff_duration: Dict[EndpointCategory, float] = {}
        self._backoff_lock = asyncio.Lock()

        # Initialize buckets for each category
        for category, config in RATE_LIMITS.items():
            self.buckets[category] = TokenBucket(config)

    async def _wait_for_backoff(self, category: EndpointCategory) -> float:
        """Sleep until any active 429 backoff for ``category`` has expired.

        The backoff lock is held only while reading the deadline, never while
        sleeping, so a backoff in one category does not stall other categories
        or ``handle_429_error``. The deadline is re-read after each sleep in
        case it was extended in the meantime.

        Returns:
            float: Time waited in seconds
        """
        waited = 0.0
        while True:
            async with self._backoff_lock:
                backoff_until = self._429_backoff.get(category, 0.0)

            wait_time = backoff_until - time.monotonic()
            if wait_time <= 0:
                return waited

            logger.warning(
                f"429 backoff active for {category.value}. "
                f"Waiting {wait_time:.2f}s"
            )
            await asyncio.sleep(wait_time)
            waited += wait_time

    async def acquire(
        self,
        category: EndpointCategory,
        tokens: int = 1,
        retry_on_429: bool = True
    ) -> float:
        """
        Acquire rate limit tokens before making API request.

        Args:
            category: Endpoint category
            tokens: Number of tokens to acquire (default 1)
            retry_on_429: Whether to apply backoff if 429 was recently seen

        Returns:
            float: Total time waited in seconds

        Raises:
            ValueError: If ``tokens`` is negative or exceeds the capacity of
                the category's bucket.
        """
        bucket = self.buckets.get(category)
        if bucket is None:
            logger.warning(f"Unknown category: {category}. No rate limiting applied.")
            return 0.0

        total_wait = 0.0

        # Apply 429 backoff if needed
        if retry_on_429:
            total_wait += await self._wait_for_backoff(category)

        # Acquire tokens from bucket
        total_wait += await bucket.acquire(tokens)

        return total_wait

    async def handle_429_error(
        self,
        category: EndpointCategory,
        retry_after: Optional[int] = None
    ) -> None:
        """
        Handle 429 Too Many Requests error with exponential backoff.

        Args:
            category: Endpoint category that received 429
            retry_after: Retry-After header value in seconds (if provided).
                Missing or non-positive values fall back to exponential backoff.
        """
        async with self._backoff_lock:
            now = time.monotonic()

            if retry_after is not None and retry_after > 0:
                # Use server-provided retry-after
                backoff_time = float(retry_after)
            elif self._429_backoff.get(category, 0.0) > now:
                # Already in backoff: double the previous backoff *duration*.
                # Doubling the time remaining would shrink the backoff whenever
                # more than half of it had already elapsed.
                previous = self._429_backoff_duration.get(
                    category, _INITIAL_BACKOFF_SECONDS
                )
                backoff_time = min(previous * 2, _MAX_BACKOFF_SECONDS)
            else:
                # First 429 in a while, start with 1s
                backoff_time = _INITIAL_BACKOFF_SECONDS

            self._429_backoff[category] = now + backoff_time
            self._429_backoff_duration[category] = backoff_time

            logger.warning(
                f"429 error for {category.value}. "
                f"Setting backoff for {backoff_time:.2f}s"
            )

    def get_status(self) -> Dict[str, Dict[str, Any]]:
        """
        Get current status of all rate limit buckets.

        Returns:
            Dict with status for each category, keyed by the category value
        """
        status: Dict[str, Dict[str, Any]] = {}
        now = time.monotonic()

        for category, bucket in self.buckets.items():
            backoff_remaining = max(0.0, self._429_backoff.get(category, 0.0) - now)

            status[category.value] = {
                "available_tokens": bucket.available_tokens(),
                "max_tokens": bucket.max_tokens,
                "refill_rate_per_sec": bucket.refill_rate,
                "backoff_remaining_sec": backoff_remaining,
                "is_throttled": backoff_remaining > 0,
            }

        return status

    def reset_backoff(self, category: Optional[EndpointCategory] = None) -> None:
        """
        Reset 429 backoff for a category or all categories.

        Args:
            category: Category to reset, or None to reset all
        """
        if category is not None:
            self._429_backoff[category] = 0.0
            self._429_backoff_duration.pop(category, None)
            logger.info(f"Reset backoff for {category.value}")
        else:
            self._429_backoff.clear()
            self._429_backoff_duration.clear()
            logger.info("Reset all backoffs")


# Singleton instance
_rate_limiter: Optional[RateLimiter] = None


def get_rate_limiter() -> RateLimiter:
    """Get or create the singleton rate limiter instance"""
    global _rate_limiter
    if _rate_limiter is None:
        _rate_limiter = RateLimiter()
    return _rate_limiter

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/caiovicentino/polymarket-mcp-server'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.

rate_limiter.py•9.08 KiB