Web Search MCP

Overview Schema Related Servers Score Discussions

search.py•3.71 KiB

"""Core search logic — framework-agnostic, used by both FastAPI and MCP server.""" from __future__ import annotations import asyncio import logging import time from datetime import datetime, timezone from src.api.schemas import ( SearchMetadata, SearchRequest, SearchResponse, ) from src.config import SearchEngine from src.engine.base import BaseSearchEngine from src.engine.bing import BingSearchEngine from src.engine.duckduckgo import DuckDuckGoSearchEngine from src.engine.google import GoogleSearchEngine from src.scraper.browser import BrowserPool from src.scraper.depth import crawl_results, fetch_page_content from src.scraper.parser import extract_main_content_markdown logger = logging.getLogger(__name__) class SearchError(Exception): """Raised when a search cannot be performed.""" ENGINES: dict[SearchEngine, BaseSearchEngine] = { SearchEngine.GOOGLE: GoogleSearchEngine(), SearchEngine.BING: BingSearchEngine(), SearchEngine.DUCKDUCKGO: DuckDuckGoSearchEngine(), } FALLBACK_ORDER: dict[SearchEngine, list[SearchEngine]] = { SearchEngine.GOOGLE: [SearchEngine.DUCKDUCKGO, SearchEngine.BING], SearchEngine.BING: [SearchEngine.DUCKDUCKGO, SearchEngine.GOOGLE], SearchEngine.DUCKDUCKGO: [SearchEngine.BING, SearchEngine.GOOGLE], } async def do_search(pool: BrowserPool, req: SearchRequest) -> SearchResponse: """Execute a search with engine fallback and multi-depth crawling.""" if not pool._started: raise SearchError("Browser pool not initialized") start = time.monotonic() total_timeout = req.timeout or 25 async def _inner() -> SearchResponse: used_engine = req.engine async with pool.acquire() as page: engine = ENGINES[req.engine] results = await engine.search(page, req.query, req.max_results) if not results: for fallback in FALLBACK_ORDER.get(req.engine, []): logger.info( "Engine %s returned 0 results, falling back to %s", req.engine.value, fallback.value, ) fb_engine = ENGINES[fallback] results = await fb_engine.search(page, req.query, req.max_results) if results: 
used_engine = fallback break # Depth crawling with remaining time budget elapsed_so_far = time.monotonic() - start remaining = max(5, total_timeout - elapsed_so_far) results = await crawl_results(pool, results, depth=req.depth, timeout=int(remaining)) elapsed = int((time.monotonic() - start) * 1000) return SearchResponse( query=req.query, engine=used_engine, depth=req.depth, total=len(results), results=results, metadata=SearchMetadata( elapsed_ms=elapsed, timestamp=datetime.now(timezone.utc).isoformat(), engine=used_engine, depth=req.depth, ), ) try: return await asyncio.wait_for(_inner(), timeout=total_timeout) except asyncio.TimeoutError: elapsed = int((time.monotonic() - start) * 1000) logger.warning("do_search timed out after %dms (limit=%ds)", elapsed, total_timeout) raise SearchError(f"Search timed out after {total_timeout}s") async def fetch_url_content(pool: BrowserPool, url: str, timeout: int = 30) -> str: """Fetch a single URL and return its main content as markdown.""" async with pool.acquire() as page: html = await fetch_page_content(page, url, timeout) if not html: return "" return extract_main_content_markdown(html)

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/uk0/web-search-fast'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.

search.py•3.71 KiB