Zotero MCP Server

Apache 2.0
OverviewInspectSchema Related Servers Reviews Score
zotero_mcp
#!/usr/bin/env python3
"""MCP server implementation for Zotero integration."""

import json
import logging
import os
from typing import Any, Dict, List, Optional
from pathlib import Path
from dotenv import load_dotenv
load_dotenv()

from fastmcp import FastMCP, Context
from pyzotero import zotero
from anthropic import Anthropic
from pypdf import PdfReader
from io import BytesIO
import tempfile
import zipfile

logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

TODO_TAG_NAME = "todo"
SUMMARIZED_TAG_NAME = "summarized"
ERROR_TAG_NAME = "error"
DENY_TAG_NAME = "deny"

mcp = FastMCP(
    "zotero-mcp-server",
    version="0.1.0",
    capabilities={"tools": True}
)

try:
    zot = zotero.Zotero(
        os.environ['ZOTERO_USER_ID'],
        "user",
        os.environ['ZOTERO_API_KEY'],
        local=True  # use local Zotero library instead of making network calls
    )
    # test the connection
    zot.items(limit=1)
except Exception as e:
    if "Local API is not enabled" in str(e):
        logger.error("Zotero local API is not enabled. Please enable it in Zotero Preferences -> Advanced -> Allow other applications on this computer to communicate with Zotero.")
        exit(1)
    else:
        logger.error(f"Error connecting to Zotero: {e}")
        exit(1)

anthropic = Anthropic(api_key=os.environ.get('ANTHROPIC_API_KEY', '')) # Remove proxies parameter

@mcp.tool()
def search_papers(tags: List[str] = None, query: str = None) -> dict:
    """Search through Zotero papers based on tags and/or text.
    
    Args:
        tags: List of tags to filter by
        query: Search query to filter by title and creator fields
    """
    try:
        if tags and query:
            # If both tags and query are provided, first search by query then filter by tags
            items = zot.items(q=query)
            # Filter for tags client-side
            items = [item for item in items 
                    if all(tag in [t['tag'] for t in item['data'].get('tags', [])] 
                    for tag in tags)]
        elif tags:
            # use a single tag for now since the API handles multiple tags differently
            items = zot.items(tag=tags[0]) if len(tags) == 1 else zot.items()
            # filter for multiple tags client-side if needed
            if len(tags) > 1:
                items = [item for item in items 
                        if all(tag in [t['tag'] for t in item['data'].get('tags', [])] 
                        for tag in tags)]
        elif query:
            # Search by query only
            items = zot.items(q=query)
        else:
            items = zot.items()

        # enhanced response with more useful information
        processed_items = []
        for item in items:
            # skip attachments and notes
            if item.get('data', {}).get('itemType') in ['attachment', 'note']:
                continue
                
            item_data = item.get('data', {})
            processed_item = {
                'key': item.get('key'),
                'title': item_data.get('title', 'Unknown Title'),
                'authors': item_data.get('creators', []),
                'year': item_data.get('date', '').split('-')[0] if item_data.get('date') else None,
                'tags': [t.get('tag') for t in item_data.get('tags', [])],
                'abstract': item_data.get('abstractNote'),
                'url': item_data.get('url'),
                'item_type': item_data.get('itemType'),
                'raw_data': item  # Include raw data for complete access 
            }
            processed_items.append(processed_item)

        return {
            "status": "success", 
            "total_results": len(processed_items),
            "items": processed_items
        }
    except Exception as e:
        logger.error(f"Error searching papers: {str(e)}")
        return {"status": "error", "message": str(e)}

@mcp.tool()
def get_paper_notes(item_key: str) -> Dict[str, Any]:
    """Get all notes attached to a specific paper."""
    try:
        notes = zot.children(item_key)
        return {
            "notes": [{
                "key": note["key"],
                "text": note["data"].get("note", ""),
                "tags": [tag["tag"] for tag in note["data"].get("tags", [])]
            } for note in notes if note["data"].get("itemType") == "note"]
        }
    except Exception as e:
        logger.error(f"Error getting notes: {e}")
        raise ValueError(str(e))

@mcp.tool()
def get_paper(item_key: str) -> Dict[str, Any]:
    """Get details for a specific paper."""
    try:
        item = zot.item(item_key)
        if not item:
            return {"status": "error", "message": "Paper not found"}
            
        item_data = item.get('data', {})
        processed_item = {
            'key': item.get('key'),
            'title': item_data.get('title', 'Unknown Title'),
            'authors': item_data.get('creators', []),
            'year': item_data.get('date', '').split('-')[0] if item_data.get('date') else None,
            'tags': [t.get('tag') for t in item_data.get('tags', [])],
            'abstract': item_data.get('abstractNote'),
            'url': item_data.get('url'),
            'item_type': item_data.get('itemType'),
            'raw_data': item
        }
        return {"status": "success", "item": processed_item}
    except Exception as e:
        logger.error(f"Error getting paper: {str(e)}")
        return {"status": "error", "message": str(e)}

@mcp.tool()
def add_note(item_key: str, note_text: str, tags: List[str] = None) -> dict:
    """Add a note to a specific paper."""
    try:
        # verify the paper exists first
        paper = get_paper(item_key)
        if paper.get("status") == "error":
            return paper
        
        # create the note
        template = {
            'itemType': 'note',
            'parentItem': item_key,
            'note': note_text,
            'tags': [{'tag': tag} for tag in (tags or [])]
        }
        
        result = zot.create_items([template])
        note_key = result.get("successful", {}).get("0", {}).get("key")
        
        return {
            "status": "success",
            "note_key": note_key,
            "paper_title": paper["item"]["title"]
        }
    except Exception as e:
        logger.error(f"Error adding note: {str(e)}")
        return {"status": "error", "message": str(e)}

@mcp.tool()
def get_pdf_content(item_key: str) -> dict:
    """Get the PDF content for a given item.
    
    Args:
        item_key: The Zotero item key
    """
    try:
        # First get the item to find its attachments
        item = zot.item(item_key)
        
        # Look for PDF attachment in the links
        if 'attachment' in item['links'] and item['links']['attachment']['attachmentType'] == 'application/pdf':
            attachment_key = item['links']['attachment']['href'].split('/')[-1]
            # Get the PDF content
            pdf_content = zot.file(attachment_key)
            return {
                'success': True,
                'content': pdf_content,
                'attachment_key': attachment_key
            }
        
        # If not found in links, check children
        children = zot.children(item_key)
        for child in children:
            if child['data'].get('itemType') == 'attachment' and child['data'].get('contentType') == 'application/pdf':
                pdf_content = zot.file(child['key'])
                return {
                    'success': True,
                    'content': pdf_content,
                    'attachment_key': child['key']
                }
        
        return {
            'success': False,
            'error': 'No PDF attachment found for this item'
        }
        
    except Exception as e:
        logger.error(f"Error getting PDF content: {e}")
        return {
            'success': False,
            'error': str(e)
        }

@mcp.tool()
def request_summary(item_key: str) -> Dict[str, Any]:
    """Request a summary for a paper."""
    try:
        # add TODO tag to trigger summarization
        item = zot.item(item_key)
        tags = item["data"]["tags"]
        if not any(tag["tag"] == TODO_TAG_NAME for tag in tags):
            tags.append({"tag": TODO_TAG_NAME})
            item["data"]["tags"] = tags
            zot.update_item(item)
        return {"status": "success", "message": "Summary requested"}
    except Exception as e:
        logger.error(f"Error requesting summary: {e}")
        raise ValueError(str(e))

if __name__ == "__main__":
    # local testing
    load_dotenv()
    
    required_env_vars = ['ZOTERO_USER_ID']
    missing_vars = [var for var in required_env_vars if not os.getenv(var)]
    
    if missing_vars:
        logger.error(f"Missing required environment variables: {', '.join(missing_vars)}")
        logger.error("Please ensure these are set in your .env file")
        exit(1)
        
    mcp.run()