# fetcher.py
import json

import httpx
from bs4 import BeautifulSoup
from markdownify import MarkdownConverter

from .types import FetchRequestArgs, FetchResponse


class NoImagesConverter(MarkdownConverter):
    """Custom MarkdownConverter that drops all images during conversion."""

    def convert_img(self, el, text, parent_tags):
        # Return an empty string instead of converting the image
        return ""
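

# Illustrative note: because convert_img() above returns an empty string,
# NoImagesConverter().convert('<p>Hi <img src="x.png"></p>') is expected to
# produce markdown whose only visible text is "Hi" (plus whitespace added by
# markdownify); the image is simply dropped rather than rendered as ![](...).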


class Fetcher:
    """Handles fetching and processing web content."""

    DEFAULT_HEADERS = {
        "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36 Jij-MCP/0.1 (+https://github.com/Jij-Inc/Jij-MCP-Server)"
    }

    @staticmethod
    async def _fetch(payload: FetchRequestArgs) -> httpx.Response:
        """Internal fetch method using httpx."""
        headers = Fetcher.DEFAULT_HEADERS.copy()
        if payload.headers:
            headers.update(payload.headers)
        async with httpx.AsyncClient(follow_redirects=True, timeout=30.0) as client:
            try:
                response = await client.get(
                    str(payload.url), headers=headers
                )  # Convert HttpUrl to str for httpx
                response.raise_for_status()  # Raises HTTPStatusError for 4xx/5xx responses
                return response
            except httpx.HTTPStatusError as e:
                raise ConnectionError(
                    f"HTTP error: {e.response.status_code} for url: {e.request.url}"
                ) from e
            except httpx.RequestError as e:
                raise ConnectionError(
                    f"Failed to fetch {payload.url}: {type(e).__name__}"
                ) from e
            except Exception as e:
                # Handle potential URL parsing issues or other unexpected errors
                raise ConnectionError(
                    f"An unexpected error occurred for {payload.url}: {e}"
                ) from e

    @staticmethod
    async def html(payload: FetchRequestArgs) -> FetchResponse:
        """Fetches content as raw HTML."""
        try:
            response = await Fetcher._fetch(payload)
            html_content = await response.aread()  # Read as bytes
            # Try decoding with UTF-8 first, then fall back to the detected encoding
            try:
                html_text = html_content.decode("utf-8")
            except UnicodeDecodeError:
                # Fallback using detected encoding or a robust alternative
                detected_encoding = (
                    response.encoding or "iso-8859-1"
                )  # Default fallback
                html_text = html_content.decode(detected_encoding, errors="replace")
            return FetchResponse(
                content=[{"type": "text", "text": html_text}], isError=False
            )
        except Exception as e:
            return FetchResponse(content=[], isError=True, errorMessage=str(e))

    @staticmethod
    async def json(payload: FetchRequestArgs) -> FetchResponse:
        """Fetches content and parses it as JSON."""
        try:
            response = await Fetcher._fetch(payload)
            # response.json() decodes synchronously; the body was already read in _fetch
            json_content = response.json()
            # Pretty-print the JSON as an indented string
            json_string = json.dumps(json_content, indent=2, ensure_ascii=False)
            return FetchResponse(
                content=[{"type": "text", "text": json_string}], isError=False
            )
        except json.JSONDecodeError as e:
            return FetchResponse(
                content=[],
                isError=True,
                errorMessage=f"Failed to decode JSON from {payload.url}: {e}",
            )
        except Exception as e:
            return FetchResponse(content=[], isError=True, errorMessage=str(e))

    @staticmethod
    async def txt(payload: FetchRequestArgs) -> FetchResponse:
        """Fetches content and returns plain text."""
        try:
            response = await Fetcher._fetch(payload)
            html_content = (
                await response.aread()
            )  # Read as bytes for bs4 encoding detection
            # BeautifulSoup can often detect encoding better
            soup = BeautifulSoup(html_content, "lxml")  # Use lxml parser
            # Remove script and style elements
            for element in soup(["script", "style"]):
                element.decompose()
            text = soup.get_text(separator=" ", strip=True)
            # Optional extra whitespace normalization (currently disabled):
            # normalized_text = " ".join(text.split())
            return FetchResponse(
                content=[{"type": "text", "text": text}], isError=False
            )
        except Exception as e:
            return FetchResponse(content=[], isError=True, errorMessage=str(e))

    @staticmethod
    async def markdown(payload: FetchRequestArgs) -> FetchResponse:
        """Fetches content and converts it to Markdown."""
        try:
            response = await Fetcher._fetch(payload)
            html_content = await response.aread()
            # Decode carefully before passing to markdownify
            try:
                html_text = html_content.decode("utf-8")
            except UnicodeDecodeError:
                detected_encoding = response.encoding or "iso-8859-1"
                html_text = html_content.decode(detected_encoding, errors="replace")
            # Use custom NoImagesConverter to ignore images
            converter = NoImagesConverter()
            md = converter.convert(html_text)
            return FetchResponse(content=[{"type": "text", "text": md}], isError=False)
        except Exception as e:
            return FetchResponse(content=[], isError=True, errorMessage=str(e))
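

# Minimal usage sketch (not part of the library proper).  It assumes that
# FetchRequestArgs (defined in .types and not shown here) is a Pydantic-style
# model accepting a `url` and an optional `headers` mapping, matching how
# `payload.url` and `payload.headers` are used above; adjust the constructor call
# if the real model differs.  Because of the relative import at the top, run this
# as a module (e.g. `python -m <package>.fetcher`), not as a standalone script.
if __name__ == "__main__":
    import asyncio

    async def _demo() -> None:
        args = FetchRequestArgs(url="https://example.com")  # hypothetical constructor call
        result = await Fetcher.markdown(args)
        if result.isError:
            print(f"Fetch failed: {result.errorMessage}")
        else:
            # Content items are built above as {"type": "text", "text": ...} dicts;
            # if FetchResponse coerces them into typed objects, adapt this access.
            print(result.content[0])

    asyncio.run(_demo())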