"""Exporter module - exports training data to JSONL format."""
import hashlib
import json
import random
import re
from pathlib import Path
import aiosqlite
from titan_factory.config import Config
from titan_factory.schema import Candidate, GeneratedFile, JudgeScore, TeacherModel, UISpec
from titan_factory.utils import ensure_dir, log_info, log_success
# === Chat Template ===
# Keep the exported assistant message strict and consistent:
# - A <think> block (either from the teacher model, or a deterministic fallback)
# - A single JSON object matching TrainingOutput: {"ui_spec": ..., "files": [...]}
SYSTEM_MESSAGE = """You are Titan 4 Design, a UI generation expert.
First, analyze the request in <think> tags - consider the brand, layout, sections, and implementation approach.
Then output valid JSON with your ui_spec and generated files.
Rules:
- No markdown. No code fences.
- No extra text before <think> or after the final }.
- Use Next.js App Router + TypeScript + Tailwind CSS. No UI libraries.
Output format:
<think>...</think>
{"ui_spec": {...}, "files": [{"path":"app/page.tsx","content":"..."}]}"""
_THINK_BLOCK_RE = re.compile(r"<think>(?P<think>[\s\S]*?)</think>", re.IGNORECASE)
_CODE_OLD_BLOCK_RE = re.compile(r"<CODE_OLD>[\s\S]*?</CODE_OLD>", re.IGNORECASE)
def _extract_think_block(raw_response: str) -> str | None:
"""Extract a <think>...</think> block from a raw model response.
We prefer preserving teacher reasoning verbatim (when present),
but we only export the think block + validated JSON payload for schema consistency.
Args:
raw_response: Full raw model response
Returns:
A complete <think>...</think> string, or None if not found.
"""
match = _THINK_BLOCK_RE.search(raw_response or "")
if not match:
return None
think = match.group("think").strip()
if not think:
return "<think></think>"
# Hard cap to avoid runaway reasoning blobs bloating training tokens
if len(think) > 4000:
think = think[:4000].rstrip() + "\n[truncated]"
return f"<think>\n{think}\n</think>"
def _fallback_think(ui_spec: UISpec, is_edit: bool) -> str:
"""Deterministically synthesize a short <think> block from the UI_SPEC.
Some teacher models occasionally omit <think>. We still want the exported dataset
to have consistent reasoning structure. This fallback is derived only from the
already-validated UI_SPEC (no hidden chain-of-thought).
"""
brand = ui_spec.brand
content = ui_spec.content
sections = [s.id for s in ui_spec.layout.sections][:8]
page_type = ui_spec.page_type
page_type_value = page_type.value if hasattr(page_type, "value") else str(page_type)
mode = "edit/refactor" if is_edit else page_type_value
lines = [
f"Goal: {mode} UI for {content.business_name} in {content.city}.",
f"Brand: {brand.mood} mood with {brand.accent} accent; {', '.join(brand.style_keywords[:3])}.",
f"Layout: sections={sections}.",
"Implementation: Next.js App Router + TS + Tailwind; no UI libs; keep code compact and accessible.",
]
return "<think>\n" + "\n".join(lines) + "\n</think>"
def format_training_example(
task_prompt: str,
ui_spec: UISpec,
files: list[GeneratedFile],
raw_response: str | None = None,
is_edit: bool = False,
code_old: str | None = None,
) -> dict:
"""Format a training example in chat format.
Args:
task_prompt: Original task prompt
ui_spec: UI specification
files: Generated files
raw_response: Full model response including <think> blocks (preferred)
is_edit: Whether this is an edit task
code_old: Original code for edit tasks
Returns:
Training example dict
"""
# Build user message
if is_edit and code_old:
# If the prompt already contains a CODE_OLD block (older runs / manual prompts),
# replace its content to avoid duplication and ensure correct code_old.
if "<CODE_OLD>" in task_prompt and "</CODE_OLD>" in task_prompt:
user_content = _CODE_OLD_BLOCK_RE.sub(
f"<CODE_OLD>\n{code_old}\n</CODE_OLD>",
task_prompt,
)
else:
user_content = f"{task_prompt}\n\n<CODE_OLD>\n{code_old}\n</CODE_OLD>"
else:
user_content = task_prompt
# Always export a strict TrainingOutput JSON payload for schema consistency.
# If a teacher response is available, preserve its <think> block for reasoning training.
assistant_response = {
"ui_spec": ui_spec.model_dump(),
"files": [f.model_dump() for f in files],
}
think_block = _extract_think_block(raw_response or "")
if think_block is None:
think_block = _fallback_think(ui_spec, is_edit=is_edit)
assistant_content = (
think_block
+ "\n"
+ json.dumps(assistant_response, ensure_ascii=False, separators=(",", ":"))
)
return {
"messages": [
{"role": "system", "content": SYSTEM_MESSAGE},
{"role": "user", "content": user_content},
{"role": "assistant", "content": assistant_content},
]
}
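# Minimal usage sketch (assumes `spec` is a validated UISpec and `files` is a
# list of GeneratedFile objects produced elsewhere in the pipeline):
#   example = format_training_example(
#       task_prompt="Create a calm themed landing page for Acme Plumbing ...",
#       ui_spec=spec,
#       files=files,
#       raw_response=None,  # no teacher <think>, so a fallback is synthesized
#   )
#   assert [m["role"] for m in example["messages"]] == ["system", "user", "assistant"]
#   assert example["messages"][2]["content"].startswith("<think>")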
def _compute_publishable_from_db(
publishable_flag: bool,
planner_model_json: str | None,
patcher_models_json: str | None,
) -> bool:
"""Compute publishable status from DB fields.
Uses the full teacher chain to determine if candidate is publishable.
A candidate is only publishable if ALL models in the chain are publishable.
Args:
publishable_flag: The generator's publishable flag
planner_model_json: JSON string of planner TeacherModel
patcher_models_json: JSON string of patcher TeacherModel list
Returns:
True if all models in chain are publishable
"""
if not publishable_flag:
return False
# Check planner
if planner_model_json:
try:
planner_data = json.loads(planner_model_json)
if not planner_data.get("publishable", True):
return False
except (json.JSONDecodeError, AttributeError, TypeError):  # tolerate malformed teacher metadata
pass
# Check all patchers
if patcher_models_json:
try:
patchers = json.loads(patcher_models_json)
for patcher in patchers:
if not patcher.get("publishable", True):
return False
except (json.JSONDecodeError, AttributeError, TypeError):  # tolerate malformed teacher metadata
pass
return True
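# Illustrative chain logic (hypothetical JSON payloads): a candidate is only
# publishable when the generator flag AND every teacher in the chain allow it.
#   _compute_publishable_from_db(True, '{"publishable": true}', '[{"publishable": true}]')  -> True
#   _compute_publishable_from_db(True, '{"publishable": false}', None)                      -> False
#   _compute_publishable_from_db(False, None, None)                                         -> False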
async def load_candidates_from_manifest(manifest_path: Path) -> list[dict]:
"""Load selected/accepted candidates from manifest database.
Args:
manifest_path: Path to manifest.db
Returns:
List of candidate records with task info including original prompt
"""
async with aiosqlite.connect(manifest_path) as conn:
# Get candidates marked selected/accepted, including original prompt and teacher chain
cursor = await conn.execute("""
SELECT
t.id as task_id,
t.niche_id,
t.page_type,
t.prompt,
t.is_edit,
t.code_old,
t.ui_spec,
c.id as candidate_id,
c.files,
c.score,
c.publishable,
c.planner_model,
c.patcher_models,
c.raw_generator_response
FROM candidates c
JOIN tasks t ON c.task_id = t.id
WHERE c.status IN ('selected', 'accepted')
""")
records = []
async for row in cursor:
# Compute publishable from full teacher chain
publishable = _compute_publishable_from_db(
publishable_flag=bool(row[10]),
planner_model_json=row[11],
patcher_models_json=row[12],
)
records.append({
"task_id": row[0],
"niche_id": row[1],
"page_type": row[2],
"prompt": row[3], # Original prompt stored in DB
"is_edit": bool(row[4]), # Stored is_edit flag
"code_old": row[5], # Stored code_old for edits
"ui_spec": json.loads(row[6]) if row[6] else None,
"candidate_id": row[7],
"files": json.loads(row[8]) if row[8] else [],
"score": row[9],
"publishable": publishable, # Computed from full teacher chain
"raw_generator_response": row[13], # Full response with <think> for training
})
return records
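# Usage sketch (illustrative; must run inside an event loop):
#   records = await load_candidates_from_manifest(run_dir / "manifest.db")
#   winners = [r for r in records if r["publishable"]]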
def split_records(
records: list[dict],
config: Config,
) -> tuple[list[dict], list[dict], list[dict]]:
"""Split records into train, validation, and holdout sets.
Args:
records: All records
config: Configuration with split settings
Returns:
Tuple of (train, validation, holdout) record lists
"""
# Determine holdout niches
all_niches = list(set(r["niche_id"] for r in records))
random.shuffle(all_niches)
if config.export.holdout_niche_ids:
holdout_niches = set(config.export.holdout_niche_ids)
else:
holdout_count = config.export.holdout_niches
holdout_niches = set(all_niches[:holdout_count])
log_info(f"Holding out {len(holdout_niches)} niches for generalization testing")
# Split by niche
holdout = [r for r in records if r["niche_id"] in holdout_niches]
remaining = [r for r in records if r["niche_id"] not in holdout_niches]
# Random validation split within remaining
random.shuffle(remaining)
val_count = int(len(remaining) * config.export.validation_split)
validation = remaining[:val_count]
train = remaining[val_count:]
log_info(f"Split: {len(train)} train, {len(validation)} validation, {len(holdout)} holdout")
return train, validation, holdout
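# Worked example (hypothetical config: holdout_niches=2, validation_split=0.1,
# no explicit holdout_niche_ids): with 1,000 records spread evenly over 20
# niches, roughly 100 records land in holdout (2 niches), int(900 * 0.1) = 90
# in validation, and the remaining 810 in train. Note the shuffles are not
# seeded, so reruns can assign different niches and records to each split.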
async def export_run(
run_dir: Path,
config: Config,
*,
min_score: float | None = None,
) -> None:
"""Export a run's results to training format.
Creates both public/ and private/ exports.
Args:
run_dir: Run output directory
config: Configuration
min_score: Optional minimum score filter for exported winners
"""
manifest_path = run_dir / "manifest.db"
if not manifest_path.exists():
raise FileNotFoundError(f"Manifest not found: {manifest_path}")
# Load all selected/accepted candidates
records = await load_candidates_from_manifest(manifest_path)
log_info(f"Loaded {len(records)} selected/accepted candidates")
if not records:
log_info("No records to export")
return
if min_score is not None:
before = len(records)
records = [
r for r in records
if r.get("score") is not None and float(r["score"]) >= float(min_score)
]
log_info(f"Filtered to {len(records)}/{before} records with score >= {min_score:.1f}")
if not records:
log_info("No records met the minimum score filter; nothing to export")
return
# Write rich records (all candidates for audit)
suffix = f"_min{min_score:.1f}".replace(".", "_") if min_score is not None else ""
rich_path = run_dir / f"rich_records{suffix}.jsonl"
with open(rich_path, "w") as f:
for record in records:
f.write(json.dumps(record) + "\n")
log_info(f"Wrote {len(records)} rich records to {rich_path}")
# Export public (publishable only)
public_records = [r for r in records if r["publishable"]]
if public_records:
await _export_track(
public_records,
run_dir / f"public{suffix}",
config,
f"public{suffix}",
)
# Export private (all)
await _export_track(
records,
run_dir / f"private{suffix}",
config,
f"private{suffix}",
)
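# Typical invocation sketch (assumes a loaded Config; "runs/2024-01-01" is a
# placeholder path):
#   import asyncio
#   from pathlib import Path
#   asyncio.run(export_run(Path("runs/2024-01-01"), config, min_score=7.5))
# This writes rich_records_min7_5.jsonl plus public_min7_5/ and private_min7_5/
# track directories under the run directory.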
async def _export_track(
records: list[dict],
output_dir: Path,
config: Config,
track_name: str,
) -> None:
"""Export a single track (public or private).
Args:
records: Records to export
output_dir: Output directory
config: Configuration
track_name: Track name for logging
"""
ensure_dir(output_dir)
# Split into train/val/holdout
train, validation, holdout = split_records(records, config)
# Write train.jsonl
train_path = output_dir / "train.jsonl"
_write_training_jsonl(train, train_path)
# Write valid.jsonl
valid_path = output_dir / "valid.jsonl"
_write_training_jsonl(validation, valid_path)
# Write holdout.jsonl (for later evaluation)
holdout_path = output_dir / "holdout.jsonl"
_write_training_jsonl(holdout, holdout_path)
log_success(
f"Exported {track_name}: "
f"{len(train)} train, {len(validation)} valid, {len(holdout)} holdout"
)
def _write_training_jsonl(records: list[dict], path: Path) -> None:
"""Write records to training JSONL format.
Uses the original stored prompt rather than reconstructing it.
This ensures training data matches what was actually generated.
Args:
records: Records to write
path: Output path
"""
with open(path, "w") as f:
for record in records:
if not record["ui_spec"] or not record["files"]:
continue
# Reconstruct objects
ui_spec = UISpec.model_validate(record["ui_spec"])
files = [GeneratedFile.model_validate(f) for f in record["files"]]
# Use stored prompt and edit info (not reconstructed!)
task_prompt = record.get("prompt")
is_edit = record.get("is_edit", False)
code_old = record.get("code_old")
# Fallback to reconstruction only if prompt wasn't stored
# (for backwards compatibility with older manifests)
if not task_prompt:
task_prompt = _reconstruct_prompt(record, ui_spec)
# Get raw response (includes <think> blocks for training reasoning)
raw_response = record.get("raw_generator_response")
# Format training example
example = format_training_example(
task_prompt=task_prompt,
ui_spec=ui_spec,
files=files,
raw_response=raw_response,
is_edit=is_edit,
code_old=code_old if is_edit else None,
)
f.write(json.dumps(example) + "\n")
def _reconstruct_prompt(record: dict, ui_spec: UISpec) -> str:
"""Reconstruct a task prompt from the UI spec.
Args:
record: Record dict
ui_spec: UI specification
Returns:
Reconstructed prompt
"""
# Build a prompt that matches the style of the original
page_type = record["page_type"]
brand = ui_spec.brand
content = ui_spec.content
if page_type == "landing":
return f"""Create a {brand.mood} themed landing page for {content.business_name}, a {ui_spec.niche.vertical.replace("_", " ")} in {content.city}.
Style: {", ".join(brand.style_keywords)}, {brand.accent} accent
CTA: "{ui_spec.cta.primary}"
{content.offer}. Target audience: {content.audience}.
Make it premium with: {", ".join(content.highlights[:3])}. No UI libraries."""
elif page_type == "directory_home":
return f"""Create a {brand.mood} directory homepage for finding {ui_spec.niche.vertical.replace("_", " ")} services.
Style: {", ".join(brand.style_keywords)}, {brand.accent} accent
Include search, filters, and listing grid. No UI libraries."""
elif page_type in ("city_index", "category_index"):
return f"""Create a {brand.mood} {page_type.replace("_", " ")} page for {ui_spec.niche.vertical.replace("_", " ")} in {content.city}.
Style: {", ".join(brand.style_keywords)}, {brand.accent} accent
Include filterable listings grid and local info. No UI libraries."""
elif page_type == "listing_profile":
return f"""Create a {brand.mood} listing detail page for {content.business_name}.
Style: {", ".join(brand.style_keywords)}, {brand.accent} accent
CTA: "{ui_spec.cta.primary}"
Include gallery, info, services, reviews, and contact. No UI libraries."""
elif page_type == "admin_dashboard":
return f"""Create a {brand.mood} admin dashboard for managing a {ui_spec.niche.vertical.replace("_", " ")} business.
Style: {", ".join(brand.style_keywords)}, {brand.accent} accent
Include stats, activity table, and charts. No UI libraries."""
else:
return f"""Create a {page_type} page for {content.business_name}.
Style: {brand.mood}, {", ".join(brand.style_keywords)}, {brand.accent} accent
No UI libraries."""
async def export_stats(run_dir: Path) -> dict:
"""Get statistics for a run.
Args:
run_dir: Run directory
Returns:
Stats dictionary
"""
manifest_path = run_dir / "manifest.db"
if not manifest_path.exists():
return {"error": "Manifest not found"}
async with aiosqlite.connect(manifest_path) as conn:
# Task counts by status
cursor = await conn.execute(
"SELECT status, COUNT(*) FROM tasks GROUP BY status"
)
task_stats = dict(await cursor.fetchall())
# Candidate counts by status
cursor = await conn.execute(
"SELECT status, COUNT(*) FROM candidates GROUP BY status"
)
candidate_stats = dict(await cursor.fetchall())
# Average score of selected/accepted
cursor = await conn.execute(
"SELECT AVG(score) FROM candidates WHERE status IN ('selected', 'accepted')"
)
avg_score = (await cursor.fetchone())[0]
# Selected/accepted by model
cursor = await conn.execute(
"SELECT generator_model, COUNT(*) FROM candidates WHERE status IN ('selected', 'accepted') GROUP BY generator_model"
)
winners_by_model = dict(await cursor.fetchall())
return {
"tasks": task_stats,
"candidates": candidate_stats,
"avg_winner_score": round(avg_score, 2) if avg_score else 0,
"winners_by_model": winners_by_model,
}
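# Usage sketch (illustrative):
#   import asyncio
#   from pathlib import Path
#   stats = asyncio.run(export_stats(Path("runs/2024-01-01")))
#   print(stats["avg_winner_score"], stats["winners_by_model"])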