Map Traveler MCP

Overview Schema Related Servers Score Discussions

map-traveler-mcp
src

ImageService.ts•50.5 KiB

/*! map-traveler-mcp | MIT License | https://github.com/mfukushim/map-traveler-mcp */ import {Effect, Schedule, Option, Schema} from "effect"; import sharp = require("sharp"); import {HttpClient, HttpClientRequest, HttpClientResponse} from "@effect/platform"; import dayjs from "dayjs"; import {Jimp} from "jimp"; import {PixAIClient} from '@pixai-art/client' import {type MediaBaseFragment, TaskBaseFragment} from "@pixai-art/client/types/generated/graphql.js"; import 'dotenv/config' import {logSync, McpLogService} from "./McpLogService.js"; import { __pwd, DbService, } from "./DbService.js"; import WebSocket from 'ws' import * as path from "path"; import * as os from "node:os"; import * as fs from "node:fs"; import {execSync} from "node:child_process"; import {defaultAvatarId} from "./RunnerService.js"; import {ImageMethod, Mode, TravelerEnv} from "./EnvUtils.js"; import {GeminiImageGenerator} from "./Generators/GeminiGenerator.js"; import FormData from "form-data"; import {TimeoutException} from "effect/Cause"; import {fileURLToPath} from "url"; export const defaultBaseCharPrompt = 'depth of field, cinematic composition, masterpiece, best quality,looking at viewer,(solo:1.1),(1 girl:1.1),loli,school uniform,blue skirt,long socks,black pixie cut' export const defaultBaseCharPromptV4 = 'a Girl is school uniform,blue skirt,long socks,black pixie cut' const defaultPixAiModelId = '1648918127446573124'; export class ImageService extends Effect.Service<ImageService>()("traveler/ImageService", { accessors: true, effect: Effect.gen(function* () { let recentImage: Buffer | undefined // 直近の1生成画像を保持する snsのpostに自動引用する const getImageOutSize = () => { return DbService.getSysEnv().pipe(Effect.andThen(runnerEnv => { const widthOut = Number.parseInt(runnerEnv.image_width || "512") || 512; const heightOut = Math.floor(widthOut * 0.75); return {widthOut, heightOut} })) } const regDel = /$(.+):.+$/ const getBasePrompt = (avatarId: number) => { return Effect.gen(function* () { const runnerEnv = yield* DbService.getSysEnv() if (runnerEnv.fixed_model_prompt) { return runnerEnv.fixed_model_prompt } return yield* DbService.getAvatarModel(avatarId).pipe( Effect.andThen(a => { // geminiの場合 (word:n.n)様式の指定値はエラーになりやすいのでdbに入っていたら強制除去する if (runnerEnv.useAiImageGen === 'gemini') { return a.baseCharPrompt.split(',').map(v => { const s = v.replace(regDel, '$1') if (s.includes('masterpiece') || s.includes('best quality') || s.includes('loli') || s.includes('looking at viewer')|| s.includes('depth of field')|| s.includes('cinematic composition')) { return [] } return [s] }).flat().join(',')+ ',anime' } return a.baseCharPrompt + ',anime'; }), Effect.orElseSucceed(() => { if (runnerEnv.useAiImageGen === 'gemini') { return defaultBaseCharPromptV4 } return defaultBaseCharPrompt; })); }) } // TODO notifications/progress を発行すべき const progress = (total = 1, progress = 0, env: Mode) => { logSync('progress:', env.progressToken, total, progress) if (env.progressToken === undefined) { return Effect.void } return Effect.void // return McpService.sendProgressNotification(env.progressToken || '', total, progress).pipe( // Effect.repeat(Schedule.repeatForever.pipe(Schedule.intersect(Schedule.spaced("15 seconds")))), // ); } function sdMakeTextToImage(prompt: string, runnerEnv: TravelerEnv, opt?: { width?: number, height?: number, sampler?: string, samples?: number, steps?: number, cfg_scale?: number }) { return Effect.gen(function* () { const param = prompt.split(',').reduce((p, c) => { const match = c.trim().match(/$(\w+):([0-9.]+)$/) if (match) { p.list.push({text: p.buf, weight: 1}) p.list.push({text: match[1].trim(), weight: Number.parseFloat(match[2])}) return p } else { return {buf: p.buf ? `${p.buf},${c}` : c, list: p.list} } }, {list: [] as { text: string, weight: number }[], buf: ''}); if (param.buf) { param.list.push({text: param.buf, weight: 1}) } // yield* McpLogService.logTrace(`sdMakeTextToImage:${JSON.stringify(param.list)}`); if (param.list.length > 10) { return yield* Effect.fail(new Error('param weight too long')) } const sdKey: string = runnerEnv.sd_key || '' const client = yield* HttpClient.HttpClient; return yield* HttpClientRequest.post(`https://api.stability.ai/v1/generation/stable-diffusion-xl-1024-v1-0/text-to-image`).pipe( HttpClientRequest.setHeaders({ Authorization: `Bearer ${sdKey}`, Accept: "application/json", }), HttpClientRequest.bodyJson({ cfg_scale: opt?.cfg_scale || 7, height: opt?.height || 1024, width: opt?.width || 1024, sampler: opt?.sampler || "K_DPM_2_ANCESTRAL", samples: opt?.samples || 1, steps: opt?.steps || 30, text_prompts: param.list }), Effect.flatMap(client.execute), Effect.flatMap(a => a.json), // Effect.tap(a => McpLogService.logTrace('sdMakeTextToImage:' + JSON.stringify(a).slice(0, 200))), Effect.andThen(a => a as { artifacts: { base64: string, finishReason: string, seed: number }[] }), Effect.flatMap(a => { if (!a.artifacts || a.artifacts.length === 0 || a.artifacts.some(b => b.finishReason !== 'SUCCESS')) { return Effect.fail(new Error(`fail sd:${opt?.width},${opt?.height},` + JSON.stringify(a))) } return Effect.tryPromise(() => sharp(Buffer.from(a.artifacts[0].base64, 'base64')).resize({ width: 512, height: 512 }).png().toBuffer()) }), Effect.retry(Schedule.recurs(1).pipe(Schedule.intersect(Schedule.spaced("5 seconds")))), Effect.mapError(e => new Error(`sdMakeTextToImage error:${e}`)), Effect.scoped, ) }) } function sdMakeImageToImage(prompt: string, runnerEnv: TravelerEnv, inImage: Buffer, opt?: { width?: number, height?: number, sampler?: string, samples?: number, steps?: number, cfg_scale?: number }) { const sdKey: string = runnerEnv.sd_key || '' return Effect.tryPromise(() => sharp(inImage).resize({ width: opt?.width || 1024, height: opt?.height || 1024 }).png().toBuffer()).pipe( Effect.andThen(a => Effect.tryPromise({ try: () => { const formData = new FormData() formData.append('init_image', a) formData.append('init_image_mode', 'IMAGE_STRENGTH') formData.append('image_strength', 0.35) formData.append('text_prompts[0][text]', prompt) formData.append('cfg_scale', 7) formData.append('samples', 1) formData.append('steps', 30) return fetch( `https://api.stability.ai/v1/generation/stable-diffusion-xl-1024-v1-0/image-to-image`, { method: 'POST', headers: { ...formData.getHeaders(), Accept: 'application/json', Authorization: `Bearer ${sdKey}`, }, // @ts-ignore body: formData.getBuffer(), } ) }, catch: error => new Error(`${error}`) })), Effect.andThen(a => a.json()), // Effect.tap(a => McpLogService.logTrace('sdMakeImageToImage:' + JSON.stringify(a).slice(0, 200))), Effect.andThen(a => a as { artifacts: { base64: string, finishReason: string, seed: number }[] }), Effect.flatMap(a => { if (!a.artifacts || a.artifacts.length === 0 || a.artifacts.some(b => b.finishReason !== 'SUCCESS')) { return Effect.fail(new Error(`fail sd:${opt?.width},${opt?.height},` + JSON.stringify(a))) } return Effect.succeed(Buffer.from(a.artifacts[0].base64, 'base64')) }), ) } function sdMakeImage(prompt: string, runnerEnv: TravelerEnv, inImage?: Buffer, opt?: { width?: number, height?: number, sampler?: string, samples?: number, steps?: number, cfg_scale?: number, }) { const sdKey: string = runnerEnv.sd_key || '' if (!sdKey) { return Effect.fail(new Error('no key')) } return inImage ? sdMakeImageToImage(prompt, runnerEnv, inImage, opt) : sdMakeTextToImage(prompt, runnerEnv, opt); } function pixAiMakeImage(prompt: string, runnerEnv: TravelerEnv, inImage?: Buffer, opt?: { width?: number, height?: number, sampler?: string, samples?: number, steps?: number, cfg_scale?: number, }) { if (!runnerEnv.pixAi_key) { return Effect.fail(new Error('no key')) } const pixAiClient = new PixAIClient({ apiKey: runnerEnv.pixAi_key || '', webSocketImpl: WebSocket }) return Effect.retry( Effect.gen(function* () { let mediaId if (inImage) { const buf = new ArrayBuffer(inImage.byteLength); new Uint8Array(buf).set(new Uint8Array(inImage)); const blob = new Blob([buf], {type: 'image/jpeg'}); const file = new File([blob], "image.jpg", {type: 'image/jpeg'}) mediaId = yield* Effect.tryPromise({ try: () => pixAiClient.uploadMedia(file), catch: error => new Error(`uploadMedia fail:${error}`) }).pipe(Effect.andThen(a1 => { return !a1.mediaId ? Effect.fail(new Error(`uploadMedia fail`)) : Effect.succeed(a1.mediaId); })) } return mediaId }).pipe( // Effect.tap(a => McpLogService.logTrace(`uploadMedia ${a}`)), // Effect.tapError(a => McpLogService.logError(`uploadMedia error ${a}`)), Effect.andThen(a => { const body = a ? { prompts: prompt, modelId: runnerEnv.pixAi_modelId || defaultPixAiModelId, width: opt?.width || 512, height: opt?.height || 512, mediaId: a } : { prompts: prompt, modelId: runnerEnv.pixAi_modelId || defaultPixAiModelId, width: opt?.width || 512, height: opt?.height || 512, } return Effect.tryPromise({ try: () => pixAiClient.generateImage(body, ), catch: error => new Error(`generateImage fail:${error}`) }).pipe(Effect.timeout('1 minute')) }), // Effect.tap(a => McpLogService.logTrace(`generateImage ${a.status}`)), Effect.tapError(a => McpLogService.logError(`generateImage ${a}`)), Effect.andThen(task => { return Effect.tryPromise({ try: () => pixAiClient.getMediaFromTask(task as TaskBaseFragment), catch: error => new Error(`getMediaFromTask fail:${error}`) }) }), Effect.tap(() => McpLogService.logTrace(`getMediaFromTask`)), Effect.andThen(media => { if (!media) return Effect.fail(new Error(`media fail1:${media}`)) if (Array.isArray(media)) return Effect.fail(new Error(`media fail2:${media}`)) return Effect.tryPromise({ try: () => pixAiClient.downloadMedia(media as MediaBaseFragment), catch: error => new Error(`downloadMedia fail:${error}`) }); }), Effect.andThen(a => Buffer.from(a)), Effect.tap(a => McpLogService.logTrace(`downloadMedia out:${a.length}`)), Effect.tapError(a => McpLogService.logError(`downloadMedia err:${a}`)), ), Schedule.recurs(4).pipe(Schedule.intersect(Schedule.spaced("10 seconds")))); } /** * ホテル画像 * @param selectGen * @param hour * @param append * @param localDebug */ function makeHotelPict(selectGen: ImageMethod | undefined, hour: number, append ?: string, localDebug = false) { return Effect.gen(function* () { const env = yield* DbService.getSysEnv() if (!selectGen || env.mode.isPractice) { // 画像生成AIがなければ固定ホテル画像を使う return yield* Effect.async<Buffer, Error>((resume) => fs.readFile(path.join(__pwd, 'assets/hotelPict.png'), (err, data) => { if (err) { resume(Effect.fail(err)) } resume(Effect.succeed(data)); })).pipe(Effect.andThen(a => Buffer.from(a))) } let avatarImage:Buffer|undefined let prompt = ''; let room = '' if (hour < 6 || hour >= 19) { room += 'hotel room,desk,drink,laptop computer,talking to computer,sitting,window,night,(pyjamas:1.3)' } else if (hour < 11) { room += 'hotel room,desk,drink,laptop computer,talking to computer,sitting,window,morning' } else if (hour < 16) { room += 'cafe terrace,outdoor dining table,outdoor bistro chair,drink,laptop computer,talking to computer,sitting,noon' } else { room += 'cafe terrace,outdoor dining table,outdoor bistro chair,drink,laptop computer,talking to computer,sitting,evening' } if (append) { room += `,${append}` } if (selectGen === 'gemini' && env.avatar_image_uri) { prompt = 'Using the provided image, create a realistic anime girl in ' + room avatarImage = yield *getAvatarTemplateImage(env.avatar_image_uri); } else { prompt = (yield* getBasePrompt(defaultAvatarId)) + room } const {widthOut, heightOut} = yield* getImageOutSize(); return yield* selectImageGenerator(selectGen, prompt,avatarImage).pipe( Effect.tap(a => { recentImage = a if (localDebug) { return Effect.async<void, Error>((resume) => fs.writeFile('tools/test/hotelPict.png', a, err => { if (err) { resume(Effect.fail(err)) } resume(Effect.void) })) } }), Effect.andThen(a => Effect.tryPromise(() => sharp(a).resize({ width: widthOut, height: heightOut }).png().toBuffer())) ) }) } /** * 船等の特殊ロケーション * @param selectGen * @param vehiclePrompt * @param timeZoneId * @param localDebug * @private */ function makeEtcTripImage(selectGen: ImageMethod, vehiclePrompt: string, timeZoneId: string, localDebug = false) { // 乗り物の旅行画像生成 // 画像保存 // 乗り物と緯度経度での日記生成 // 日記のブログ結合 // 日記のtwitterポストはするかどうするか // 開始と終了の位置をrunStatusから取り出す // 対応する会話イベントがあるかどうかを確認してログを抽出する return Effect.gen(function* () { // 設定日時に対応した画像を生成する const env = yield *DbService.getSysEnv() const appendPrompts: string[] = [] appendPrompts.push(vehiclePrompt) const now = dayjs() const hour = now.tz(timeZoneId).hour() if (hour < 6 || hour >= 19) { appendPrompts.push('night') } else if (hour < 11) { appendPrompts.push('morning') } else if (hour < 16) { appendPrompts.push('noon') } else { appendPrompts.push('evening') } const {widthOut, heightOut} = yield* getImageOutSize() const appendPrompt = appendPrompts.join(',') let avatarImage:Buffer|undefined let prompt = ''; if (selectGen === 'gemini' && env.avatar_image_uri) { prompt = 'Using the provided image, create a realistic anime girl in ' + appendPrompt avatarImage = yield *getAvatarTemplateImage(env.avatar_image_uri); } else { prompt = (yield* getBasePrompt(defaultAvatarId)) + appendPrompt } return yield* selectImageGenerator(selectGen, prompt,avatarImage).pipe( Effect.tap(a => { recentImage = a if (localDebug) { return Effect.async<void, Error>((resume) => fs.writeFile('tools/test/etcPict.png', a, err => { if (err) { resume(Effect.fail(err)) } resume(Effect.void) })) } }), Effect.andThen(a => Effect.tryPromise(() => sharp(a).resize({ width: widthOut, height: heightOut }).png().toBuffer())) ) }) } /** * 絵生成のpromptを生成する * @param baseCharPrompt * @param simple * @param withAbort * @private */ const generatePrompt = (baseCharPrompt: string, simple = false, withAbort = false) => { return Effect.gen(function* () { const backPrompt = (simple || withAbort) ? ',(simple background:1.2)' : ',road' // ここがキャラの基本スタイル const basePrompt = baseCharPrompt + backPrompt; const prompt: string[] = []; const bodyRnd = Math.random() const faceRnd = Math.random() const poseRnd = Math.random() if (simple || withAbort) { if (withAbort) { // 電話絵は上半身のみ prompt.push('(upper body:1.3)'); } else { // 簡易背景は上半身かカウボーイショット prompt.push(Math.random() < 0.3 ? '(upper body:1.3)' : '(cowboy shot:1.3)'); // 立ち絵背景は単調にならないようにfromを後ろと横を少し入れる(SDXLから精度が高くなったので単調化しやすい) const fromRnd = Math.random() if (fromRnd < 0.3) { prompt.push('from back') } else if (fromRnd < 0.4) { prompt.push('from side') } } } else { // 通常は全身、カウボーイショット、上半身の各種をやってみる if (bodyRnd < 0.3) { prompt.push('full body'); } else if (bodyRnd < 0.6) { prompt.push('cowboy shot'); } else { prompt.push('upper body'); } } if (withAbort) { prompt.push('surprised,(calling phone:1.2),(holding smartphone to ear:1.2)'); } else { if (faceRnd < 0.1) { prompt.push(':D'); } else if (faceRnd < 0.3) { prompt.push('smiling'); } else if (faceRnd < 0.4) { prompt.push('laughing'); } else if (faceRnd < 0.6) { prompt.push('surprised'); } else if (faceRnd < 0.8) { prompt.push('grin'); } // なしもある if (poseRnd < 0.2) { prompt.push('looking around'); } else if (poseRnd < 0.6) { prompt.push('walking,looking sky') } else if (poseRnd < 0.7) { prompt.push('jumping') } else { prompt.push('standing') // 立ちの場合に少しポーズを入れる const faceRnd = Math.random() if (faceRnd < 0.2) { prompt.push('(salute:1.3),posing,(tilt my head:1.2)') } else if (faceRnd < 0.5) { prompt.push('posing,(tilt my head:1.2)') } } } const ap = prompt.join(',') return {prompt: `${basePrompt},${ap}`, append: ap}; }) } /** * 絵生成のpromptを生成するV4 * @param baseCharPrompt * @param simple * @param withAbort * @private */ const generatePromptV4 = (baseCharPrompt: string, simple = false, withAbort = false) => { return Effect.gen(function* () { const backPrompt = (simple || withAbort) ? ',simple background' : ',road' // ここがキャラの基本スタイル const basePrompt = baseCharPrompt + backPrompt; const prompt: string[] = []; const faceRnd = Math.random() const poseRnd = Math.random() if (simple || withAbort) { if (withAbort) { // 電話絵は上半身のみ prompt.push('upper body'); } else { // 立ち絵背景は単調にならないようにfromを後ろと横を少し入れる(SDXLから精度が高くなったので単調化しやすい) const fromRnd = Math.random() if (fromRnd < 0.3) { prompt.push('from back') } else if (fromRnd < 0.4) { prompt.push('from side') } } } else { // 通常は全身、カウボーイショット、上半身の各種をやってみる // if (bodyRnd < 0.3) { // prompt.push('full body'); // } else if (bodyRnd < 0.6) { // prompt.push('cowboy shot'); // } else { // prompt.push('upper body'); // } } if (withAbort) { prompt.push('surprised,calling phone,holding smartphone to ear'); } else { if (faceRnd < 0.1) { prompt.push(':D'); } else if (faceRnd < 0.3) { prompt.push('smiling'); } else if (faceRnd < 0.4) { prompt.push('laughing'); } else if (faceRnd < 0.6) { prompt.push('surprised'); } else if (faceRnd < 0.8) { prompt.push('grin'); } // なしもある if (poseRnd < 0.2) { prompt.push('looking around'); } else if (poseRnd < 0.6) { prompt.push('walking,looking sky') } else if (poseRnd < 0.7) { prompt.push('jumping') } else { prompt.push('standing') // 立ちの場合に少しポーズを入れる const faceRnd = Math.random() if (faceRnd < 0.2) { prompt.push('salute,posing,tilt my head') } else if (faceRnd < 0.5) { prompt.push('posing,tilt my head') } } } const ap = prompt.join(',') return {prompt: `${basePrompt},${ap}`, append: ap}; }) } const selectImageGenerator = (generatorId: ImageMethod, prompt: string, inImage?: Buffer, opt?: Record<string, any>) => { return Effect.gen(function* () { const runnerEnv = yield* DbService.getSysEnv() switch (generatorId) { case 'pixAi': return yield* pixAiMakeImage(prompt, runnerEnv, inImage, opt) case 'comfyUi': { const optList = runnerEnv.comfy_params ? runnerEnv.comfy_params.split(',').map(a => { const b = a.split('='); const val = b[1].includes("'") ? b[1].replaceAll("'", "") : Number.parseFloat(b[1]) return [b[0], val] }) : [] const optC: Record<string, any> = {...Object.fromEntries(optList), ...opt} if (!optC.width) { optC.width = 1024 } if (!optC.height) { optC.height = 1024 } return yield* comfyApiMakeImage(prompt, inImage, optC); } case 'gemini': { return yield* geminiMakeImage(prompt, runnerEnv, inImage, opt) } default: return yield* sdMakeImage(prompt, runnerEnv, inImage, opt) } }) }; /** * 人物像の成功度を確認する * @param avatarImage * @param windowSize */ function checkPersonImage(avatarImage: Buffer, windowSize: { w: number; h: number }) { return Effect.gen(function* () { const image = yield* Effect.tryPromise(() => Jimp.read(avatarImage)); // アルファ領域のピクセル数をカウントと囲むサイズを抽出する let minX = Number.MAX_SAFE_INTEGER let minY = Number.MAX_SAFE_INTEGER let maxX = Number.MIN_SAFE_INTEGER let maxY = Number.MIN_SAFE_INTEGER let alphaCount = 0 image.scan(0, 0, image.width, image.height, (x, y, idx) => { const alpha = image.bitmap.data[idx + 3]; if (alpha > 127) { alphaCount++ minX = Math.min(minX, x) minY = Math.min(minY, y) maxX = Math.max(maxX, x) maxY = Math.max(maxY, y) } }) const alphaNum = {alphaCount, rect: {x: minX, y: minY, w: maxX - minX, h: maxY - minY}} const number = alphaNum.alphaCount / (windowSize.w * windowSize.h); return {alphaNum, number}; }) } const rembgCli = (sdImage: Buffer, env: TravelerEnv) => { return Effect.gen(function* () { // TODO EffectのCommandをうまく書けなかったのでnodejsの素で const tempPath = os.tmpdir() const tempIn = path.join(tempPath, `tr-${crypto.randomUUID()}.png`) const tempOut = path.join(tempPath, `tr-${crypto.randomUUID()}.png`) fs.writeFileSync(tempIn, sdImage) let rembgPath if (env.mode.rembgPath) { rembgPath = env.mode.rembgPath } else { yield* Effect.fail(new Error('rembgPath not set')) } yield* Effect.addFinalizer(() => McpLogService.logTrace(`rembg finalizer ${tempPath}`).pipe(Effect.andThen(() => { try { fs.unlinkSync(tempIn) } catch (e) { } try { fs.unlinkSync(tempOut) } catch (e) { } }))) try { execSync(`${rembgPath} i ${tempIn} ${tempOut}`) } catch (e) { yield* Effect.fail(new Error(`rembg fail ${e}`)) } return fs.readFileSync(tempOut); }).pipe(Effect.scoped) } const rembgService = (sdImage: Buffer, env: TravelerEnv) => { return Effect.gen(function* () { yield* McpLogService.logTrace('in rembgService') if (!env.mode.remBgUrl) { return yield* Effect.fail(new Error('no rembg url')) } return yield* Effect.tryPromise({ try: () => { const formData = new FormData() formData.append("file", sdImage, { filename: "input.png", // ファイル名を指定（必須） contentType: "image/png" // 適切な Content-Type を指定 }); return fetch(`${env.mode.remBgUrl}/api/remove`, { method: 'POST', headers: { ...formData.getHeaders(), }, // @ts-ignore body: formData.getBuffer(), } ) }, catch: error => new Error(`${error}`) }).pipe( Effect.scoped, Effect.andThen( a => Effect.tryPromise(() => a.arrayBuffer())), Effect.tap(a => McpLogService.logTrace('rembgService out:', a.byteLength, a.toString())), Effect.tap(a => { if (a && a.byteLength) { return Effect.succeed(a) } return Effect.fail(new Error()) }), Effect.tapError(e => McpLogService.logTrace('rembgService err:', JSON.stringify(e))), Effect.retry(Schedule.recurs(1).pipe(Schedule.intersect(Schedule.spaced("2 seconds")))), Effect.andThen(a => Buffer.from(a)) ) }) } const rembgApi = (sdImage: Buffer) => { return Effect.gen(function* () { yield* McpLogService.logTrace('in rembgApi') const runnerEnv = yield* DbService.getSysEnv() if (!runnerEnv.remBgWoKey) { return yield* Effect.fail(new Error('no rembg Wo key')) } const client = yield* HttpClient.HttpClient; return yield* HttpClientRequest.post(`https://api.withoutbg.com/v1.0/image-without-background-base64`).pipe( HttpClientRequest.setHeaders({ Accept: "application/json", "Content-Type": "application/json", "X-API-Key": runnerEnv.remBgWoKey, }), HttpClientRequest.bodyJson({ image_base64: sdImage.toString("base64"), }), Effect.flatMap(client.execute), Effect.flatMap(a => a.json), Effect.andThen((a: any) => { // TODO うまくSchema.decode出来なかったので雑にキャストする if (a.error) { return Effect.fail(new Error(`rembgApi error:${JSON.stringify(a.node_errors)}`)) } return Effect.succeed(a as { img_without_background_base64: string }) }), Effect.tapError(McpLogService.logError), Effect.retry(Schedule.recurs(1).pipe(Schedule.intersect(Schedule.spaced("5 seconds")))), Effect.scoped, Effect.andThen(a => Buffer.from(a.img_without_background_base64, "base64")) ) }) } const initRembgService = (env: TravelerEnv) => { return Effect.gen(function* () { yield* McpLogService.logTrace('initRembgService in') if (!env.mode.remBgUrl) { return yield* Effect.fail(new Error('no rembg url')) } const client = yield* HttpClient.HttpClient const req = HttpClientRequest.get(`${env.mode.remBgUrl}/api`) const response = yield* client.execute(req) return yield* response.text }).pipe( Effect.scoped, Effect.retry({times: 2}), Effect.tap(a => McpLogService.logTrace('initRembgService', a)), Effect.tapError(e => McpLogService.logTrace('initRembgService err:', e.toString())), Effect.andThen(() => ({})), Effect.orElseSucceed(() => ({})), // ここはrembgに1回励起をさせるだけなのでエラーにはしない ); } const isEnableRembg = (env: TravelerEnv) => { return env.mode.rembgPath || env.mode.remBgUrl || env.remBgWoKey } const rembg = (sdImage: Buffer, env: TravelerEnv) => { if (env.remBgUrl) { return rembgService(sdImage, env) } else if (env.remBgWoKey) { return rembgApi(sdImage) } return rembgCli(sdImage, env); } /** * 旅画像生成処理V3 * @param basePhoto * @param selectGen * @param withAbort * @param opt bodyAreaRatio アバター本体占有面積比率 0.042 以上, bodyHWRatio アバター縦横比率 2.3 以上,sideBias 貼り付け位置を左右に偏らせる,bodyWindowRatioW,bodyWindowRatioH アバター合成ウィンドウ比率 * @param localDebug */ function makeRunnerImageV3( basePhoto: Buffer, selectGen: ImageMethod, withAbort = false, opt: { sideBias?: boolean, bodyAreaRatio?: number,// = 0.042, bodyHWRatio?: number, // = 1.5, // 画像AIの精度が上がっているので2.3から少し減らす bodyWindowRatioW?: number, // = {w: 0.5, h: 0.75} bodyWindowRatioH?: number, } = {bodyAreaRatio: 0.042, bodyHWRatio: 1.5, bodyWindowRatioW: 0.5, bodyWindowRatioH: 0.75}, localDebug = false, ) { return Effect.gen(function* () { const env = yield* DbService.getSysEnv() const {widthOut, heightOut} = yield* getImageOutSize() if (!isEnableRembg(env)) { // rembg pathがない場合、画像合成しないままの画像を戻す return { buf: yield* Effect.tryPromise(() => sharp(basePhoto).resize({ width: widthOut, height: heightOut }).png().toBuffer()), shiftX: 0, shiftY: 0, fit: false, append: '' } } if (env.remBgUrl) { yield* initRembgService(env) // docker rembgは初回初期化がいる } const outSize = {w: 1600, h: 1000}; const innerSize = {w: 1600, h: 1600} // TODO sdではサイズ制限がきつかったんだ const windowSize = selectGen === 'sd' ? {w: 832, h: 1216} : { w: Math.floor((innerSize.w * (opt?.bodyWindowRatioW || 0.5)) / 64) * 64, h: Math.floor((innerSize.h * (opt?.bodyWindowRatioH || 0.75)) / 64) * 64 } // const windowSize = {w: 832, h: 1216} const sideBias = opt?.sideBias || false const cutPos = sideBias ? (Math.random() < 0.5 ? Math.random() * 0.3 : 0.7 + Math.random() * 0.3) : Math.random() const shiftX = Math.floor((innerSize.w - windowSize.w) * cutPos); // 0～1で均等にランダム切り出しだったはず const innerImage = yield* Effect.tryPromise(() => sharp(basePhoto).resize({ width: innerSize.w, height: innerSize.h, fit: "fill" }).toBuffer()); const clopImage = yield* Effect.tryPromise(() => sharp(innerImage).extract({ left: shiftX, top: innerSize.h - windowSize.h, width: windowSize.w, height: windowSize.h }).toBuffer()) if (localDebug) { fs.writeFileSync('tools/test/testOutInClop.png', clopImage) } /** 画像評価リトライ */ const retryMax = 3 let retry = retryMax // 5回リトライになってるな現在初期値7 最小値2(でないと画像できない) const fixedThreshold = 2 // バストショットに切り替える閾値 2,1の2回はバストショット生成を試みる let isFixedBody = false let appendPrompt: string | undefined const avatarImage = yield* Effect.gen(function* () { const baseCharPrompt = yield* getBasePrompt(defaultAvatarId) const {prompt, append} = yield* generatePrompt(baseCharPrompt, retry < fixedThreshold, withAbort) appendPrompt = append retry-- if (retry < fixedThreshold) { // 立ち絵 isFixedBody = true yield* McpLogService.logTrace(`bast shot:${retry}`) return yield* selectImageGenerator(selectGen, prompt, undefined, { width: windowSize.w, height: windowSize.h }) } else { // 画面i2i isFixedBody = false yield* McpLogService.logTrace(`i2i:${retry}`) return yield* selectImageGenerator(selectGen, prompt, clopImage, { width: windowSize.w, height: windowSize.h, logTotal: retryMax, logProgress: retryMax - retry }) } }).pipe( // Effect.andThen(a => Buffer.from(a, 'base64')), Effect.tap(sdImage => localDebug && fs.writeFileSync('tools/test/testOutGen.png', sdImage)), Effect.andThen(sdImage => rembg(sdImage, env)), Effect.tap(avatarImage => localDebug && fs.writeFileSync('tools/test/testOutRmBg.png', avatarImage)), // Effect.tap(avatarImage => { // if (runnerEnv.ServerLog && runnerEnv.ServerLog.includes('trace')) { // fs.writeFileSync(path.join(os.tmpdir(), `trd-${crypto.randomUUID()}.png`), avatarImage, {flag: "w"}); // } // }), Effect.tap(avatarImage => { // 非透明度判定 0.02以上 const bodyAreaRatio = opt?.bodyAreaRatio || 0.042 const bodyHWRatio = opt?.bodyHWRatio || 2 return checkPersonImage(avatarImage, windowSize).pipe( Effect.tap(a => McpLogService.logTrace( `check runner image:${retry},${JSON.stringify(a)},${a.number}${a.number > bodyAreaRatio ? '>' : '<'}${bodyAreaRatio},${a.alphaNum.rect.h / a.alphaNum.rect.w}${a.alphaNum.rect.h / a.alphaNum.rect.w > bodyHWRatio ? '>' : '<'}${bodyHWRatio}`)), //, retry, number, alphaNum.rect.w, alphaNum.rect.h\ Effect.andThen(a => { // 非透明度が0.02以上かつ範囲の縦と横の比率が3:1以上なら完了 counterfeit V3=0.015, counterfeit LX 0.03 にしてみる // 比率値を3から2.5にしてみる。ダメ映像が増えたらまた調整する。。非透明率を0.015にしてみる return a.number > bodyAreaRatio && a.alphaNum.rect.h / a.alphaNum.rect.w > bodyHWRatio ? Effect.succeed(avatarImage) : Effect.fail(new Error('avatar fail')); }) ); }), Effect.retry(Schedule.recurs(2).pipe(Schedule.intersect(Schedule.spaced("5 seconds")))) ) const stayImage = yield* Effect.tryPromise(() => { return sharp(innerImage).composite([{ input: avatarImage, left: shiftX, top: innerSize.h - windowSize.h }]).toBuffer() }).pipe(Effect.andThen(a => Effect.tryPromise(() => sharp(a).extract({ left: (innerSize.w - outSize.w) / 2, top: (innerSize.h - outSize.h) / 2, width: outSize.w, height: outSize.h }).resize({width: 512, height: 512}).png().toBuffer()))) // 現状のClaude MCPだと512*512以上のbase64はエラーになりそう recentImage = stayImage yield* McpLogService.logTrace(`stayImage:${recentImage?.length}`) return { buf: stayImage, shiftX, shiftY: innerSize.h - windowSize.h, fit: !isFixedBody, append: appendPrompt } } ) } /** * 旅画像生成V4 * nano-banana版 * @param basePhoto * @param modelPhotoUri * @param withAbort * @param localDebug */ function makeRunnerImageV4( basePhoto: Buffer, modelPhotoUri?: string, withAbort = false, localDebug = false, ) { return Effect.gen(function* () { const env = yield* DbService.getSysEnv() if (!env.GeminiImageApi_key) { return yield* Effect.fail(new Error('no key')) } const maxRetry = env.maxRetryGemini ? (Number.parseInt(env.maxRetryGemini) || 0) : 0 const gen = yield* GeminiImageGenerator.make(env.GeminiImageApi_key); const {widthOut, heightOut} = yield* getImageOutSize() const baseCharPrompt = yield* getBasePrompt(defaultAvatarId) const photo = yield* Effect.tryPromise(_ => sharp(basePhoto).resize({ width: 512, // 最小 256 最大768 とのこと height: 512 }).png().toBuffer()) return yield* Effect.gen(function* () { let addPrompt = '' let charImage:Buffer|undefined const {prompt, append} = yield* generatePromptV4(baseCharPrompt, false, withAbort); if (modelPhotoUri) { charImage = yield* getAvatarTemplateImage(modelPhotoUri); addPrompt = `Add the girl in the second image ${append}, to the first image. Matching colors and shadows to the landscape.` // addPrompt = 'Create a new image by combining the elements from the provided images. Add a realistic anime girl in the second image to the first image. Natural coloring that blends in with the surroundings.'+append } else { addPrompt = 'Using the provided image, add a realistic anime girl,Matching colors and shadows to the landscape.' + prompt } const res = yield* gen.execLlm(addPrompt, photo, charImage) // nano-banana向けプロンプト追記 +prompt const imageOut = yield* gen.toAnswerOut(res) const out = yield* Effect.tryPromise(_ => sharp(imageOut).resize({ width: widthOut, height: heightOut }).png().toBuffer()) recentImage = out return { buf: out, shiftX: 0, shiftY: 0, fit: false, append: '' } }).pipe( Effect.timeout('1 minute'), Effect.retry(Schedule.recurs(maxRetry).pipe(Schedule.intersect(Schedule.spaced('5 seconds')))), Effect.catchIf(a => a instanceof TimeoutException, _ => Effect.fail(new Error(`gemini API error:timeout`))),) }) } function geminiMakeImage(prompt: string, runnerEnv: TravelerEnv, inImage?: Buffer, opt?: Record<string, any>) { return Effect.gen(function* () { if (!runnerEnv.GeminiImageApi_key) { return yield* Effect.fail(new Error('no key')) } const gen = yield* GeminiImageGenerator.make(runnerEnv.GeminiImageApi_key); const {widthOut, heightOut} = yield* getImageOutSize() const photo = inImage ? yield* Effect.tryPromise(_ => sharp(inImage).resize({ width: 512, // 最小 256 最大768 とのこと height: 512 }).png().toBuffer()) : runnerEnv.avatar_image_uri ? yield* getAvatarTemplateImage(runnerEnv.avatar_image_uri):undefined const res = yield* gen.execLlm(prompt, photo) // nano-banana向けプロンプト追記 +prompt const imageOut = yield* gen.toAnswerOut(res) return yield* Effect.tryPromise(_ => sharp(imageOut).resize({ width: widthOut, height: heightOut }).png().toBuffer()) }) } function getRecentImageAndClear() { const image = recentImage recentImage = undefined return image } function mergeParams(baseScript: any, map: Map<string, number>, params: Record<string, string | number>) { let scr = JSON.stringify(baseScript) // jsonPathで置き換えてるからbaseScriptのshallow copyは必要ないはず Object.keys(params).forEach(key => { const val = params[key]; const reg = new RegExp(`"${key}"`, "g") scr = scr.replaceAll(reg, typeof val === "number" ? val.toString() : `"${val.toString()}"`) }) return JSON.parse(scr) } function comfyUploadImage(inImage: Buffer, runnerEnv: TravelerEnv, opt?: { width?: number, height?: number, }) { // TODO comfyの場合のファイルアップロード。。 const nowMs = dayjs().valueOf() const fileName = `trv${nowMs}` return Effect.tryPromise(() => sharp(inImage).resize({ width: opt?.width || 1024, height: opt?.height || 1024 }).png().toBuffer()).pipe( Effect.andThen(a => Effect.tryPromise({ try: () => { const formData = new FormData() formData.append('image', a, {filename: fileName}) return fetch( `${runnerEnv.comfy_url}/upload/image`, { method: 'POST', headers: { ...formData.getHeaders(), Accept: 'application/json', }, // @ts-ignore body: formData.getBuffer(), } ) }, catch: error => new Error(`${error}`) })), Effect.andThen(a => a.json()), Effect.andThen(a => a as { name: string, subfolder: string, type: string }), Effect.andThen(a => a.name), Effect.tapError(cause => Effect.logError(cause)), Effect.retry(Schedule.recurs(1).pipe(Schedule.intersect(Schedule.spaced("3 seconds")))), ) } function comfyUpExecPrompt(script: any) { // TODO comfyの場合のファイルアップロード。。 return Effect.gen(function* () { const runnerEnv = yield* DbService.getSysEnv() const client = yield* HttpClient.HttpClient; return yield* HttpClientRequest.post(`${runnerEnv.comfy_url}/prompt`).pipe( HttpClientRequest.setHeaders({ Accept: "application/json", }), HttpClientRequest.bodyJson({ prompt: script, }), Effect.flatMap(client.execute), Effect.flatMap(a => a.json), Effect.andThen((a: any) => { // TODO うまくSchema.decode出来なかったので雑にキャストする if (a.error) { return Effect.fail(new Error(`ComfyUI error:${JSON.stringify(a.node_errors)}`)) } return Effect.succeed(a as { prompt_id: string }) }), Effect.tapError(McpLogService.logError), Effect.tap(a => McpLogService.logTrace(a)), Effect.retry(Schedule.recurs(1).pipe(Schedule.intersect(Schedule.spaced("5 seconds")))), Effect.scoped, ) }) } function downloadOutput(prompt_id: string, runnerEnv: TravelerEnv, needKeyNum: number = 1) { const sc = Schema.Record({ key: Schema.String, value: Schema.Struct({ outputs: Schema.Record({ key: Schema.String, value: Schema.Struct({ images: Schema.Array(Schema.Struct({ filename: Schema.String, subfolder: Schema.String, type: Schema.String })) }) }) }) }) return HttpClient.get(`${runnerEnv.comfy_url}/history`).pipe( Effect.andThen((response) => HttpClientResponse.schemaBodyJson(sc)(response)), Effect.scoped, Effect.andThen((a1: any) => { const prOut = a1[prompt_id] if (!prOut) { // TODO ここの書き方どうなるんだろう? return Effect.fail(new Error('wait not ready')) } const outputs = prOut.outputs const keys = Object.keys(outputs); return Effect.forEach(keys, a => { const imageList: { filename: string, subfolder: string, type: string }[] = outputs[a].images return Effect.forEach(imageList, a2 => HttpClient.get(`${runnerEnv.comfy_url}/view`, { urlParams: { filename: a2.filename, subfolder: a2.subfolder, type: a2.type } }).pipe( Effect.andThen((response) => response.arrayBuffer), Effect.scoped, )) }) }), Effect.retry(Schedule.recurs(44).pipe(Schedule.intersect(Schedule.spaced("10 seconds")))), Effect.andThen(a => a.flat()) ) } function comfyApiMakeImage(prompt: string, inImage?: Buffer, params?: Record<string, any>) { return Effect.gen(function* () { const runnerEnv = yield* DbService.getSysEnv() if (!runnerEnv.comfy_url) { return yield* Effect.fail(new Error('no comfy_url')) } const logTotal = params?.logTotal const logProgress = params?.logProgress yield* Effect.fork(progress(logTotal || 1, logProgress || 0, runnerEnv.mode)) const uploadFileName = inImage ? yield* comfyUploadImage(inImage, runnerEnv, params,).pipe(Effect.andThen(a => Effect.succeedSome(a))) : Option.none() // uploadFileNameはプロンプトスクリプト内で置き換えなければならないので const scriptName = inImage ? (runnerEnv.comfy_workflow_i2i ? 'i2i' : 'i2i_sample') : (runnerEnv.comfy_workflow_t2i ? 't2i' : 't2i_sample') const scriptTables = yield* DbService.getScriptTable() const sdT2i = scriptTables.get(scriptName); if (!sdT2i) { return yield* Effect.fail(new Error('comfyApiMakeImage no script table')) } const mappedRecord = params ? Object.fromEntries( Object.entries(params).map(([key, value]) => [`%${key}`, value]) ) as Record<string, any> : {}; const modelParams: Record<string, string | number> = { "%seed": params?.seed && params?.seed >= 0 ? params.seed : Math.floor(Math.random() * 999999999999999), // TODO randomは0か? どうもComfyは今randomの設定がないようだ。。。負数なら15桁の9をベースに乱数とする "%steps": params?.steps || 20, // 20->8 "%cfg": params?.cfg || 6, // 8->1.5 "%sampler_name": params?.sampler_name || 'euler', "%scheduler": params?.scheduler || 'normal', "%denoise": params?.denoise || 0.7, //0.63, "%ckpt_name": params?.ckpt_name || 'v1-5-pruned-emaonly-fp16.safetensors', "%prompt": prompt, "%negative_prompt": params?.negative_prompt || 'nsfw, text, watermark', "%width": params?.width || 1024, "%height": params?.height || 1024 }; const outParam = {...mappedRecord, ...modelParams} if (Option.isSome(uploadFileName)) { outParam["%uploadFileName"] = uploadFileName.value } const script = mergeParams(sdT2i.script, sdT2i.nodeNameToId, outParam) const ret = yield* comfyUpExecPrompt(script) return yield* downloadOutput(ret.prompt_id, runnerEnv, 1).pipe( Effect.tap(a => a.length !== 1 && a.length !== 2 && Effect.fail(new Error('download fail'))), Effect.andThen(a => Buffer.from(a[0]))) }); } function shrinkImage(image: Buffer) { return Effect.gen(function* () { const {widthOut, heightOut} = yield* getImageOutSize() return yield* Effect.tryPromise(() => sharp(image).resize({ width: widthOut, height: heightOut }).png().toBuffer()) }) } function getAvatarTemplateImage(modelPhotoUri: string) { const strings = modelPhotoUri.split('|'); let uri = modelPhotoUri if (strings.length > 1) { uri = strings[Math.floor(Math.random() * strings.length)] } return Effect.gen(function *() { let likeBuffer: Buffer if (uri.startsWith('file://')) { const filePath = fileURLToPath(new URL(uri)); likeBuffer = fs.readFileSync(filePath); } else if (uri.startsWith('https://') || uri.startsWith('http://')) { likeBuffer = yield * HttpClient.get(uri).pipe( Effect.andThen((response) => response.arrayBuffer), Effect.andThen(a => Buffer.from(a)), Effect.scoped, ) } return yield * Effect.tryPromise(_ => sharp(likeBuffer).resize({ width: 512, // 最小 256 最大768 とのこと height: 512 }).png().toBuffer()) }) } return { getRecentImageAndClear, makeHotelPict, makeEtcTripImage, makeRunnerImageV3, makeRunnerImageV4, selectImageGenerator, generatePrompt, getBasePrompt, comfyApiMakeImage, rembgService, rembgApi, shrinkImage, isEnableRembg, getImageOutSize, } }), }) { } export const ImageServiceLive = ImageService.Default

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/mfukushim/map-traveler-mcp'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

ImageService.ts•50.5 KiB