@arizeai/phoenix-mcp

Official

Overview Schema Related Servers Score Discussions

createRefusalEvaluator.ts•2.79 KiB

import { REFUSAL_CLASSIFICATION_EVALUATOR_CONFIG } from "../__generated__/default_templates"; import type { CreateClassificationEvaluatorArgs } from "../types/evals"; import type { ClassificationEvaluator } from "./ClassificationEvaluator"; import { createClassificationEvaluator } from "./createClassificationEvaluator"; export interface RefusalEvaluatorArgs< RecordType extends Record<string, unknown> = RefusalEvaluationRecord, > extends Omit< CreateClassificationEvaluatorArgs<RecordType>, "promptTemplate" | "choices" | "optimizationDirection" | "name" > { optimizationDirection?: CreateClassificationEvaluatorArgs<RecordType>["optimizationDirection"]; name?: CreateClassificationEvaluatorArgs<RecordType>["name"]; choices?: CreateClassificationEvaluatorArgs<RecordType>["choices"]; promptTemplate?: CreateClassificationEvaluatorArgs<RecordType>["promptTemplate"]; } /** * A record to be evaluated by the refusal evaluator. */ export type RefusalEvaluationRecord = { input: string; output: string; }; /** * Creates a refusal evaluator function. * * This function returns an evaluator that detects when an LLM refuses, * declines, or avoids answering a user query. It is use-case agnostic: * it only detects whether a refusal occurred, not whether the refusal * was appropriate. * * @param args - The arguments for creating the refusal evaluator. * @param args.model - The model to use for classification. * @param args.choices - The possible classification choices (defaults to REFUSAL_CHOICES). * @param args.promptTemplate - The prompt template to use (defaults to REFUSAL_TEMPLATE). * @param args.telemetry - The telemetry to use for the evaluator. * * @returns An evaluator function that takes a {@link RefusalEvaluationRecord} and returns a classification result * indicating whether the output is a refusal or an answer. * * @example * ```ts * const evaluator = createRefusalEvaluator({ model: openai("gpt-4o-mini") }); * const result = await evaluator.evaluate({ * input: "What is the capital of France?", * output: "I'm sorry, I can only help with technical questions.", * }); * console.log(result.label); // "refused" or "answered" * ``` */ export function createRefusalEvaluator< RecordType extends Record<string, unknown> = RefusalEvaluationRecord, >(args: RefusalEvaluatorArgs<RecordType>): ClassificationEvaluator<RecordType> { const { choices = REFUSAL_CLASSIFICATION_EVALUATOR_CONFIG.choices, promptTemplate = REFUSAL_CLASSIFICATION_EVALUATOR_CONFIG.template, optimizationDirection = REFUSAL_CLASSIFICATION_EVALUATOR_CONFIG.optimizationDirection, name = REFUSAL_CLASSIFICATION_EVALUATOR_CONFIG.name, ...rest } = args; return createClassificationEvaluator<RecordType>({ ...rest, promptTemplate, choices, optimizationDirection, name, }); }

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/Arize-ai/phoenix'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

createRefusalEvaluator.ts•2.79 KiB