@arizeai/phoenix-mcp

Official

Overview Schema Related Servers Score Discussions

evaluatorStore.tsx•18.5 KiB

import mergeWith from "lodash-es/mergeWith";
import invariant from "tiny-invariant";
import { createStore } from "zustand";
import { devtools } from "zustand/middleware";

import { DEFAULT_EVALUATOR_TEMPLATE } from "@phoenix/components/evaluators/templates/defaultEvaluatorTemplate";
import type {
  ClassificationChoice,
  ClassificationEvaluatorAnnotationConfig,
  ContinuousEvaluatorAnnotationConfig,
  EvaluatorInputMapping,
  EvaluatorKind,
  EvaluatorMappingSource,
  EvaluatorOptimizationDirection,
} from "@phoenix/types";
import type { DeepPartial } from "@phoenix/typeUtils";
import { compressObject } from "@phoenix/utils/objectUtils";

/**
 * Union type for annotation configs (categorical or continuous).
 */
export type AnnotationConfig =
  | ClassificationEvaluatorAnnotationConfig
  | ContinuousEvaluatorAnnotationConfig;

/**
 * The data (non-action) portion of the evaluator store.
 */
export type EvaluatorStoreProps = {
  datasetEvaluator?: {
    id: string;
  };
  evaluator: {
    id?: string;
    /** The global/internal name of the base evaluator (e.g., "hallucination") */
    globalName: string;
    /** The user-facing name for this dataset evaluator instance */
    name: string;
    inputMapping: EvaluatorInputMapping;
    kind: EvaluatorKind;
    description: string;
    isBuiltin: boolean;
    includeExplanation: boolean;
  };
  /**
   * Array of output configurations for multi-output evaluators.
   * Each config defines an annotation that the evaluator will produce.
   */
  outputConfigs: AnnotationConfig[];
  dataset?: {
    id: string;
    readonly: boolean;
    selectedExampleId: string | null;
    selectedSplitIds: string[];
  };
  evaluatorMappingSource: EvaluatorMappingSource;
  showPromptPreview: boolean;
};

/**
 * The actions exposed by the evaluator store.
 */
export type EvaluatorStoreActions = {
  /**
   * Sets the global/internal name of the base evaluator.
   * When the store holds at most one output config, that config's name is
   * updated to the same value.
   */
  setEvaluatorGlobalName: (globalName: string) => void;
  /**
   * Sets the user-facing name for this dataset evaluator instance.
   * When the store holds at most one output config, that config's name is
   * updated to the same value.
   */
  setEvaluatorName: (name: string) => void;
  /** Sets the description of the evaluator. */
  setEvaluatorDescription: (description: string) => void;
  /** Sets whether the evaluator should include an explanation in its output. */
  setIncludeExplanation: (includeExplanation: boolean) => void;
  /** Sets a single path mapping entry by key. */
  setInputMappingPath: (path: string, value: string) => void;
  /** Sets a single literal mapping entry by key. */
  setInputMappingLiteral: (literal: string, value: string) => void;
  /** Replaces the entire path mapping object. */
  setPathMapping: (pathMapping: EvaluatorInputMapping["pathMapping"]) => void;
  /** Replaces the entire literal mapping object. */
  setLiteralMapping: (
    literalMapping: EvaluatorInputMapping["literalMapping"]
  ) => void;
  /** Sets the dataset configuration for the evaluator. */
  setDataset: (dataset: EvaluatorStoreProps["dataset"]) => void;
  /**
   * Sets the dataset ID, or clears the dataset if null.
   * Throws (via invariant) when given a non-null ID while no dataset is set.
   */
  setDatasetId: (datasetId: string | null) => void;
  /** Sets the evaluator mapping source data (input, output, reference). */
  setEvaluatorMappingSource: (
    evaluatorMappingSource: EvaluatorMappingSource
  ) => void;
  /** Sets a single field of the evaluator mapping source. */
  setEvaluatorMappingSourceField: (
    field: keyof EvaluatorMappingSource,
    value: Record<string, unknown>
  ) => void;
  /**
   * Sets the currently selected example ID within the dataset.
   * Throws (via invariant) when no dataset is set.
   */
  setSelectedExampleId: (selectedExampleId?: string | null) => void;
  /**
   * Sets the selected split IDs for filtering dataset examples.
   * Throws (via invariant) when no dataset is set.
   */
  setSelectedSplitIds: (selectedSplitIds: string[]) => void;
  /** Sets whether to show the prompt preview panel. */
  setShowPromptPreview: (showPromptPreview: boolean) => void;

  // Multi-output config CRUD actions

  /** Adds a new output config to the array. */
  addOutputConfig: (config: AnnotationConfig) => void;
  /** Removes an output config at the specified index. Out-of-range indices are ignored. */
  removeOutputConfig: (index: number) => void;
  /** Updates an output config at the specified index with partial updates. */
  updateOutputConfig: (
    index: number,
    updates: Partial<AnnotationConfig>
  ) => void;
  /** Replaces all output configs with a new array. */
  setOutputConfigs: (configs: AnnotationConfig[]) => void;
  /** Sets the name of the output config at a specific index. */
  setOutputConfigNameAtIndex: (index: number, name: string) => void;
  /** Sets the optimization direction of the output config at a specific index. */
  setOutputConfigOptimizationDirectionAtIndex: (
    index: number,
    optimizationDirection: EvaluatorOptimizationDirection
  ) => void;
  /** Sets the classification choices for the output config at a specific index. */
  setOutputConfigValuesAtIndex: (
    index: number,
    values: ClassificationChoice[]
  ) => void;
  /** Registers a sub-form's trigger function for validation on submit. Returns an unregister callback. */
  registerValidator: (
    key: string,
    trigger: () => Promise<boolean>
  ) => () => void;
  /** Triggers validation on all registered sub-forms. Returns true if all are valid. */
  validateAll: () => Promise<boolean>;
};

export type EvaluatorStore = EvaluatorStoreProps & EvaluatorStoreActions;

/**
 * Default value for the evaluator mapping source.
 */
export const EVALUATOR_MAPPING_SOURCE_DEFAULT: EvaluatorMappingSource = {
  input: {},
  output: {
    messages: [
      {
        role: "assistant",
        content: "[SAMPLE] Replace this with your actual task output format",
        tool_calls: [
          {
            function: {
              name: "example_function",
              arguments: '{"param": "example_value"}',
            },
          },
        ],
      },
    ],
    available_tools: [
      {
        type: "function",
        function: {
          name: "example_function",
          description: "[SAMPLE] Example tool definition",
          parameters: {
            type: "object",
            properties: {
              param: {
                type: "string",
                description: "Example parameter",
              },
            },
            required: ["param"],
          },
        },
      },
    ],
  },
  reference: {},
  metadata: {},
};

/**
 * Default value for the evaluator mapping source as a string.
 */
export const EVALUATOR_MAPPING_SOURCE_DEFAULT_STRING = JSON.stringify(
  EVALUATOR_MAPPING_SOURCE_DEFAULT,
  null,
  2
);

/**
 * Common default values for all evaluator kinds.
 */
export const DEFAULT_STORE_VALUES = {
  evaluator: {
    globalName: "",
    name: "",
    description: "",
    inputMapping: {
      literalMapping: {},
      pathMapping: {},
    },
    includeExplanation: true,
  },
  evaluatorMappingSource: EVALUATOR_MAPPING_SOURCE_DEFAULT,
  showPromptPreview: false,
  outputConfigs: [] as AnnotationConfig[],
} satisfies DeepPartial<EvaluatorStoreProps>;

/**
 * Default output config for LLM evaluators.
 * This is a shallow copy of the first output config of the default evaluator template.
 */
const DEFAULT_LLM_OUTPUT_CONFIG: ClassificationEvaluatorAnnotationConfig = {
  ...DEFAULT_EVALUATOR_TEMPLATE.outputConfigs[0],
};

/**
 * Default values for LLM evaluators (applied when the evaluator kind is "LLM").
 */
export const DEFAULT_LLM_EVALUATOR_STORE_VALUES = {
  ...DEFAULT_STORE_VALUES,
  evaluator: {
    ...DEFAULT_STORE_VALUES.evaluator,
    kind: "LLM",
    isBuiltin: false,
  },
  outputConfigs: [DEFAULT_LLM_OUTPUT_CONFIG],
} satisfies EvaluatorStoreProps;

/**
 * Default values for built-in (code) evaluators (applied when the evaluator
 * kind is "BUILTIN").
 */
export const DEFAULT_CODE_EVALUATOR_STORE_VALUES = {
  ...DEFAULT_STORE_VALUES,
  evaluator: {
    ...DEFAULT_STORE_VALUES.evaluator,
    kind: "BUILTIN",
    isBuiltin: true,
  },
  outputConfigs: [],
} satisfies EvaluatorStoreProps;

/**
 * Creates a vanilla Zustand store holding the state of a single evaluator form.
 *
 * The initial state is built by layering, in order: the common defaults, the
 * kind-specific defaults (for "LLM" or "BUILTIN"), and finally the caller's
 * `props`. Later layers win.
 *
 * @param props - Partial initial state; `evaluator.kind` is required because it
 * selects which kind-specific defaults are applied.
 * @returns A Zustand store exposing {@link EvaluatorStoreProps} and
 * {@link EvaluatorStoreActions}.
 */
export const createEvaluatorStore = (
  props: Partial<EvaluatorStoreProps> & { evaluator: { kind: EvaluatorKind } }
) => {
  /**
   * Registry of sub-form trigger functions for validation on submit.
   * Stored outside Zustand's reactive state so that registering/unregistering
   * validators (which happens on every sub-form mount/unmount) does not cause
   * re-renders in consuming components.
   */
  const validators = new Map<string, () => Promise<boolean>>();

  return createStore<EvaluatorStore>()(
    devtools(
      (set, get) => {
        const properties = mergeWith(
          {},
          DEFAULT_STORE_VALUES,
          props.evaluator.kind === "LLM"
            ? DEFAULT_LLM_EVALUATOR_STORE_VALUES
            : {},
          props.evaluator.kind === "BUILTIN"
            ? DEFAULT_CODE_EVALUATOR_STORE_VALUES
            : {},
          props,
          // Arrays from a later source replace the accumulated value wholesale
          // instead of being merged index-by-index; returning undefined falls
          // back to the default deep-merge behavior for everything else.
          (_objValue: unknown, srcValue: unknown) =>
            Array.isArray(srcValue) ? srcValue : undefined
        ) satisfies EvaluatorStoreProps;

        const actions = {
          setEvaluatorGlobalName(globalName) {
            set(
              {
                evaluator: { ...get().evaluator, globalName },
              },
              undefined,
              "setEvaluatorGlobalName"
            );
            // With zero or one output config, keep that config's name in sync.
            // (With zero configs the index guard in the callee makes this a no-op.)
            if (get().outputConfigs.length <= 1) {
              get().setOutputConfigNameAtIndex(0, globalName);
            }
          },
          setEvaluatorName(name) {
            set(
              {
                evaluator: { ...get().evaluator, name },
              },
              undefined,
              "setEvaluatorName"
            );
            // With zero or one output config, keep that config's name in sync.
            // (With zero configs the index guard in the callee makes this a no-op.)
            if (get().outputConfigs.length <= 1) {
              get().setOutputConfigNameAtIndex(0, name);
            }
          },
          setEvaluatorDescription(description) {
            set(
              { evaluator: { ...get().evaluator, description } },
              undefined,
              "setEvaluatorDescription"
            );
          },
          setPathMapping(pathMapping) {
            const newPathMapping =
              // filter out undefined and empty key value pairs
              compressObject(pathMapping) ?? {};
            set(
              {
                evaluator: {
                  ...get().evaluator,
                  inputMapping: {
                    ...get().evaluator.inputMapping,
                    // We have to perform this cast because the type system cannot distinguish between
                    // a partial object where some keys are actually missing, and a partial object where some keys have undefined values.
                    pathMapping: newPathMapping as unknown as Record<
                      string,
                      string
                    >,
                  },
                },
              },
              undefined,
              "setPathMapping"
            );
          },
          setLiteralMapping(literalMapping) {
            const newLiteralMapping =
              // filter out undefined and empty key value pairs
              compressObject(literalMapping) ?? {};
            set(
              {
                evaluator: {
                  ...get().evaluator,
                  inputMapping: {
                    ...get().evaluator.inputMapping,
                    // Same cast rationale as for pathMapping: missing keys and
                    // undefined-valued keys are indistinguishable to the type system.
                    literalMapping: newLiteralMapping as unknown as Record<
                      string,
                      boolean | string | number
                    >,
                  },
                },
              },
              undefined,
              "setLiteralMapping"
            );
          },
          setInputMappingPath(path, value) {
            const newPathMapping =
              // filter out undefined and empty key value pairs
              compressObject({
                ...get().evaluator.inputMapping.pathMapping,
                [path]: value,
              }) ?? {};
            set(
              {
                evaluator: {
                  ...get().evaluator,
                  inputMapping: {
                    ...get().evaluator.inputMapping,
                    // We have to perform this cast because the type system cannot distinguish between
                    // a partial object where some keys are actually missing, and a partial object where some keys have undefined values.
                    pathMapping: newPathMapping as unknown as Record<
                      string,
                      string
                    >,
                  },
                },
              },
              undefined,
              "setInputMappingPath"
            );
          },
          setInputMappingLiteral(literal, value) {
            const newLiteralMapping =
              // filter out undefined and empty key value pairs
              compressObject({
                ...get().evaluator.inputMapping.literalMapping,
                [literal]: value,
              }) ?? {};
            set(
              {
                evaluator: {
                  ...get().evaluator,
                  inputMapping: {
                    ...get().evaluator.inputMapping,
                    // Same cast rationale as for pathMapping: missing keys and
                    // undefined-valued keys are indistinguishable to the type system.
                    literalMapping: newLiteralMapping as unknown as Record<
                      string,
                      boolean | string | number
                    >,
                  },
                },
              },
              undefined,
              "setInputMappingLiteral"
            );
          },
          setDataset(dataset) {
            set({ dataset }, undefined, "setDataset");
          },
          setDatasetId(datasetId) {
            if (datasetId == null) {
              // Label the clearing branch too, so it is identifiable in devtools
              // like every other update in this store.
              set({ dataset: undefined }, undefined, "setDatasetId");
              return;
            }
            const baseDataset = get().dataset;
            invariant(baseDataset, "Dataset is required to set dataset id");
            set(
              { dataset: { ...baseDataset, id: datasetId } },
              undefined,
              "setDatasetId"
            );
          },
          setEvaluatorMappingSource(evaluatorMappingSource) {
            set(
              { evaluatorMappingSource },
              undefined,
              "setEvaluatorMappingSource"
            );
          },
          setEvaluatorMappingSourceField(field, value) {
            set(
              {
                evaluatorMappingSource: {
                  ...get().evaluatorMappingSource,
                  [field]: value,
                },
              },
              undefined,
              "setEvaluatorMappingSourceField"
            );
          },
          setSelectedExampleId(selectedExampleId) {
            const baseDataset = get().dataset;
            invariant(
              baseDataset,
              "Dataset is required to set selected example id"
            );
            set(
              {
                dataset: {
                  ...baseDataset,
                  // An omitted/undefined ID is normalized to null.
                  selectedExampleId: selectedExampleId ?? null,
                },
              },
              undefined,
              "setSelectedExampleId"
            );
          },
          setSelectedSplitIds(selectedSplitIds) {
            const baseDataset = get().dataset;
            invariant(
              baseDataset,
              "Dataset is required to set selected split ids"
            );
            set(
              { dataset: { ...baseDataset, selectedSplitIds } },
              undefined,
              "setSelectedSplitIds"
            );
          },
          setShowPromptPreview(showPromptPreview) {
            set({ showPromptPreview }, undefined, "setShowPromptPreview");
          },
          setIncludeExplanation(includeExplanation) {
            set(
              { evaluator: { ...get().evaluator, includeExplanation } },
              undefined,
              "setIncludeExplanation"
            );
          },

          // Multi-output config CRUD actions
          addOutputConfig(config) {
            const currentConfigs = get().outputConfigs;
            set(
              { outputConfigs: [...currentConfigs, config] },
              undefined,
              "addOutputConfig"
            );
          },
          removeOutputConfig(index) {
            const currentConfigs = get().outputConfigs;
            // Ignore out-of-range indices, matching the other index-based
            // actions, rather than publishing an identical-content array.
            if (index < 0 || index >= currentConfigs.length) return;
            const newConfigs = currentConfigs.filter((_, i) => i !== index);
            set(
              {
                outputConfigs: newConfigs,
              },
              undefined,
              "removeOutputConfig"
            );
          },
          updateOutputConfig(index, updates) {
            const currentConfigs = get().outputConfigs;
            if (index < 0 || index >= currentConfigs.length) return;
            const newConfigs = [...currentConfigs];
            newConfigs[index] = { ...newConfigs[index], ...updates };
            set({ outputConfigs: newConfigs }, undefined, "updateOutputConfig");
          },
          setOutputConfigs(configs) {
            set({ outputConfigs: configs }, undefined, "setOutputConfigs");
          },
          setOutputConfigNameAtIndex(index, name) {
            const currentConfigs = get().outputConfigs;
            if (index < 0 || index >= currentConfigs.length) return;
            const newConfigs = [...currentConfigs];
            newConfigs[index] = { ...newConfigs[index], name };
            set(
              { outputConfigs: newConfigs },
              undefined,
              "setOutputConfigNameAtIndex"
            );
          },
          setOutputConfigOptimizationDirectionAtIndex(
            index,
            optimizationDirection
          ) {
            const currentConfigs = get().outputConfigs;
            if (index < 0 || index >= currentConfigs.length) return;
            const newConfigs = [...currentConfigs];
            newConfigs[index] = { ...newConfigs[index], optimizationDirection };
            set(
              { outputConfigs: newConfigs },
              undefined,
              "setOutputConfigOptimizationDirectionAtIndex"
            );
          },
          setOutputConfigValuesAtIndex(index, values) {
            const currentConfigs = get().outputConfigs;
            if (index < 0 || index >= currentConfigs.length) return;
            const newConfigs = [...currentConfigs];
            // Only update if it's a classification config
            const currentConfig = newConfigs[index];
            if ("values" in currentConfig) {
              newConfigs[index] = { ...currentConfig, values };
              set(
                { outputConfigs: newConfigs },
                undefined,
                "setOutputConfigValuesAtIndex"
              );
            }
          },
          registerValidator(key, trigger) {
            validators.set(key, trigger);
            return () => {
              // Only remove the entry if it still belongs to this registration,
              // so a stale unregister cannot drop a validator that was
              // registered later under the same key.
              if (validators.get(key) === trigger) {
                validators.delete(key);
              }
            };
          },
          async validateAll() {
            // Run every registered trigger concurrently; the form is valid only
            // if all of them resolve to a truthy value.
            const results = await Promise.all(
              Array.from(validators.values()).map((trigger) => trigger())
            );
            return results.every(Boolean);
          },
        } satisfies EvaluatorStoreActions;

        return {
          ...properties,
          ...actions,
        };
      },
      {
        name: "evaluatorStore",
      }
    )
  );
};

export type EvaluatorStoreInstance = ReturnType<typeof createEvaluatorStore>;

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/Arize-ai/phoenix'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.

evaluatorStore.tsx•18.5 KiB