LinkedIn MCP Server

dump_snapshots.py•2.79 KiB

"""Dump LinkedIn scraper output as timestamped local snapshots. Uses the same code paths as production (parse_person_sections / parse_company_sections). Run: uv run python scripts/dump_snapshots.py """ import asyncio import json import sys from datetime import datetime from pathlib import Path # Add project root to path sys.path.insert(0, str(Path(__file__).parent.parent)) from linkedin_mcp_server.drivers.browser import ( close_browser, ensure_authenticated, get_or_create_browser, set_headless, ) from linkedin_mcp_server.scraping import ( LinkedInExtractor, parse_company_sections, parse_person_sections, ) OUTPUT_DIR = Path(__file__).parent / "snapshot_dumps" # Targets using the same section strings as prod tool calls PERSON_TARGETS: list[tuple[str, str]] = [ ("williamhgates", "experience,education,interests,honors,languages,contact_info"), ("anistji", "experience,education,honors,languages,contact_info"), ] COMPANY_TARGETS: list[tuple[str, str]] = [ ("anthropicresearch", "posts,jobs"), ] async def main(): timestamp = datetime.now().strftime("%Y%m%d_%H%M%S") run_dir = OUTPUT_DIR / timestamp run_dir.mkdir(parents=True, exist_ok=True) set_headless(True) try: await ensure_authenticated() browser = await get_or_create_browser() extractor = LinkedInExtractor(browser.page) for username, sections_str in PERSON_TARGETS: print(f"\n--- Scraping person: {username} (sections: {sections_str}) ---") fields, _ = parse_person_sections(sections_str) result = await extractor.scrape_person(username, fields) dump_path = run_dir / f"person_{username}.json" dump_path.write_text(json.dumps(result, indent=2, ensure_ascii=False)) for section_name, text in result["sections"].items(): txt_path = run_dir / f"person_{username}_{section_name}.txt" txt_path.write_text(text) print(f" {section_name}: {len(text)} chars") for company, sections_str in COMPANY_TARGETS: print(f"\n--- Scraping company: {company} (sections: {sections_str}) ---") fields, _ = parse_company_sections(sections_str) result = await extractor.scrape_company(company, fields) dump_path = run_dir / f"company_{company}.json" dump_path.write_text(json.dumps(result, indent=2, ensure_ascii=False)) for section_name, text in result["sections"].items(): txt_path = run_dir / f"company_{company}_{section_name}.txt" txt_path.write_text(text) print(f" {section_name}: {len(text)} chars") finally: await close_browser() print(f"\n✅ Snapshots saved to {run_dir}/") if __name__ == "__main__": asyncio.run(main())

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/stickerdaniel/linkedin-mcp-server'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

dump_snapshots.py•2.79 KiB