Medplum

Official

Overview Schema Related Servers Score Discussions

token-column.ts•13.2 KiB

// SPDX-FileCopyrightText: Copyright Orangebot, Inc. and Medplum contributors
// SPDX-License-Identifier: Apache-2.0
import type { Filter, SortRule } from '@medplum/core';
import {
  Operator as FhirOperator,
  invalidSearchOperator,
  OperationOutcomeError,
  splitN,
  splitSearchOnComma,
} from '@medplum/core';
import type { Resource, ResourceType, SearchParameter } from '@medplum/fhirtypes';
import { NIL, v5 } from 'uuid';
import type { TokenColumnSearchParameterImplementation } from './searchparameter';
import { getSearchParameterImplementation } from './searchparameter';
import type { Expression, SelectQuery } from './sql';
import { Column, Condition, Disjunction, Negation, TypedCondition } from './sql';
import type { Token } from './tokens';
import { buildTokensForSearchParameter, shouldTokenExistForMissingOrPresent } from './tokens';

// Separator placed between the code, system and value parts of a token string
// (both in the strings that get hashed and in the plain text-search entries).
const DELIM = '\x01';
// Placeholder used in the system position for a value that has no system,
// which is what a `|value` query searches for.
const NULL_SYSTEM = '\x02';
// Separator between entries in the text that the text/contains regex is matched against.
const ARRAY_DELIM = '\x03'; // If `ARRAY_DELIM` changes, the `token_array_to_text` function will be outdated.
/**
 * Pseudo-system handed to `buildTokensForSearchParameter`. Tokens that carry it
 * contribute to text search but are never indexed under a searchable system.
 */
const TEXT_SEARCH_SYSTEM = '\x04';

/**
 * Computes the token-related column values of a resource for one search parameter.
 *
 * Three entries of `columns` are written: the hashed lookup tokens under
 * `impl.tokenColumnName`, the plain text-search entries under
 * `impl.textSearchColumnName`, and the sort value under `impl.sortColumnName`.
 * @param searchParam - The search parameter being indexed.
 * @param impl - The token-column implementation details for the search parameter.
 * @param columns - The column values under construction; mutated in place.
 * @param resource - The resource to extract tokens from.
 * @throws Error when an extracted token's code differs from `searchParam.code`.
 */
export function buildTokenColumns(
  searchParam: SearchParameter,
  impl: TokenColumnSearchParameterImplementation,
  columns: Record<string, any>,
  resource: Resource
): void {
  const extracted: Token[] = [];
  buildTokensForSearchParameter(extracted, resource, searchParam, TEXT_SEARCH_SYSTEM);

  // Columns can be shared between search parameters, so start from whatever is already stored.
  const hashedTokens = new Set<string>(columns[impl.tokenColumnName]);
  const textEntries = new Set<string>(columns[impl.textSearchColumnName]);
  let earliestValue: string | null = null;

  for (const token of extracted) {
    const code = token.code;
    const system = token.system?.trim?.();
    const trimmedValue = token.value?.trim?.();

    // Nothing to index without a code, or with neither a system nor a value.
    if (!code) {
      continue;
    }
    if (!system && !trimmedValue) {
      continue;
    }

    const value = trimmedValue && impl.caseInsensitive ? trimmedValue.toLocaleLowerCase() : trimmedValue;

    // Sanity check: every extracted token must belong to this search parameter.
    if (code !== searchParam.code) {
      throw new Error(`Invalid token code ${code} for search parameter with code ${searchParam.code}`);
    }

    // Text search entries. Processing deliberately continues afterwards even when
    // system === TEXT_SEARCH_SYSTEM, because exact searches on text content are
    // supported as if it were a normal token value: a Task whose `code` is
    // `{ text: 'cursor_test' }` must match `Task?code=cursor_test`.
    if (value && (system === TEXT_SEARCH_SYSTEM || impl.textSearch)) {
      textEntries.add(impl.hasDedicatedColumns ? value : code + DELIM + value);
    }

    // :missing/:present - with dedicated columns, any element in the main token column is
    // sufficient. Otherwise the hashed code itself is stored as the presence marker and
    // every other entry is namespaced by the code.
    let prefix = '';
    if (!impl.hasDedicatedColumns) {
      addHashedToken(hashedTokens, code);
      prefix = code + DELIM;
    }

    // TEXT_SEARCH_SYSTEM is never searchable as a system.
    if (system && system !== TEXT_SEARCH_SYSTEM) {
      // [parameter]=[system]|
      addHashedToken(hashedTokens, prefix + system);
      if (value) {
        // [parameter]=[system]|[code]
        addHashedToken(hashedTokens, prefix + system + DELIM + value);
      }
    }

    if (!value) {
      continue;
    }

    // Keep the value that sorts first according to localeCompare.
    if (!earliestValue || earliestValue.localeCompare(value) > 0) {
      earliestValue = value;
    }

    // [parameter]=[code]
    addHashedToken(hashedTokens, prefix + DELIM + value);
    if (!system) {
      // [parameter]=|[code]
      addHashedToken(hashedTokens, prefix + NULL_SYSTEM + DELIM + value);
    }
  }

  columns[impl.tokenColumnName] = Array.from(hashedTokens);
  columns[impl.textSearchColumnName] = Array.from(textEntries);
  columns[impl.sortColumnName] = earliestValue;
}

/**
 * Hashes a token string and stores the hash in the given set.
 * @param tokenSet - The set collecting hashed tokens.
 * @param token - The unhashed token string.
 */
function addHashedToken(tokenSet: Set<string>, token: string): void {
  const hashed = hashTokenColumnValue(token);
  tokenSet.add(hashed);
}

/**
 * Hashes a token string into the UUID form stored in the token column.
 * @param value - The unhashed token string.
 * @returns The v5 UUID of `value` computed with the NIL namespace.
 */
export function hashTokenColumnValue(value: string): string {
  const hashed = v5(value, NIL);
  return hashed;
}

/**
 * Appends the "order by" clause for a token-column search parameter to the query.
 *
 * Background from the FHIR specification:
 * - [R4](https://www.hl7.org/fhir/r4/search.html#_sort): when a search parameter refers to a
 *   repeating element, a resource can have several values for it, and the sort is based on
 *   the value that comes earliest in the requested sort order.
 * - [R5](https://www.hl7.org/fhir/r5/search.html#_sort) and later replace that wording and
 *   leave the handling of repeated and complex elements to the server's discretion.
 *
 * Current behavior: the sort uses the sort column, which holds the alphabetically first
 * value found for the parameter. Ordering can therefore be surprising when a resource has
 * several token values for the same code. Storing both the alphabetically first and last
 * values per search parameter would be one way to avoid that.
 * @param selectQuery - The select query builder.
 * @param impl - The search parameter implementation.
 * @param sortRule - The sort rule details.
 */
export function addTokenColumnsOrderBy(
  selectQuery: SelectQuery,
  impl: TokenColumnSearchParameterImplementation,
  sortRule: SortRule
): void {
  const sortColumn = new Column(undefined, impl.sortColumnName);
  selectQuery.orderBy(sortColumn, sortRule.descending);
}

/**
 * Builds the SQL expression for a search filter on a token-column search parameter.
 * @param resourceType - The resource type being searched.
 * @param tableName - The table name.
 * @param param - The search parameter.
 * @param filter - The search filter.
 * @returns The expression implementing the filter.
 * @throws Error when the parameter does not use the 'token-column' search strategy.
 * @throws OperationOutcomeError when the filter operator is not supported for token columns.
 */
export function buildTokenColumnsSearchFilter(
  resourceType: ResourceType,
  tableName: string,
  param: SearchParameter,
  filter: Filter
): Expression {
  const impl = getSearchParameterImplementation(resourceType, param);
  if (impl.searchStrategy !== 'token-column') {
    throw new Error('Invalid search strategy: ' + impl.searchStrategy);
  }

  switch (filter.operator) {
    case FhirOperator.TEXT:
    case FhirOperator.CONTAINS: {
      filter.operator satisfies TokenQueryOperator;
      // Comma-separated values are alternatives: https://www.hl7.org/fhir/r4/search.html#combining
      return new Disjunction(
        buildTokenColumnsWhereConditionTextAndContains(impl, tableName, filter.code, filter.operator, filter.value)
      );
    }

    case FhirOperator.EQUALS:
    case FhirOperator.EXACT:
    case FhirOperator.NOT:
    case FhirOperator.NOT_EQUALS: {
      filter.operator satisfies TokenQueryOperator;
      // Comma-separated values are alternatives: https://www.hl7.org/fhir/r4/search.html#combining
      const matches = buildTokenColumnsWhereConditionEqualsAndExact(
        impl,
        tableName,
        filter.code,
        filter.operator,
        filter.value
      );
      const negated = filter.operator === FhirOperator.NOT || filter.operator === FhirOperator.NOT_EQUALS;
      return negated ? new Negation(matches) : matches;
    }

    case FhirOperator.MISSING:
    case FhirOperator.PRESENT: {
      const tokenColumn = new Column(tableName, impl.tokenColumnName);
      const shouldExist = shouldTokenExistForMissingOrPresent(filter.operator, filter.value);

      if (impl.hasDedicatedColumns) {
        // With a dedicated column, any element at all means the parameter is present.
        if (shouldExist) {
          return new TypedCondition(tokenColumn, 'ARRAY_NOT_EMPTY', undefined, 'UUID[]');
        }
        return new TypedCondition(tokenColumn, 'ARRAY_EMPTY', undefined, 'UUID[]');
      }

      // Otherwise look for the hashed parameter code that is stored alongside every token.
      const hasCode = new TypedCondition(tokenColumn, 'ARRAY_OVERLAPS', hashTokenColumnValue(filter.code), 'UUID[]');
      return shouldExist ? hasCode : new Negation(hasCode);
    }

    // Operators that have no meaning for token columns.
    case FhirOperator.IN:
    case FhirOperator.NOT_IN:
    case FhirOperator.STARTS_WITH:
    case FhirOperator.GREATER_THAN:
    case FhirOperator.LESS_THAN:
    case FhirOperator.GREATER_THAN_OR_EQUALS:
    case FhirOperator.LESS_THAN_OR_EQUALS:
    case FhirOperator.STARTS_AFTER:
    case FhirOperator.ENDS_BEFORE:
    case FhirOperator.APPROXIMATELY:
    case FhirOperator.IDENTIFIER:
    case FhirOperator.ITERATE:
    case FhirOperator.ABOVE:
    case FhirOperator.BELOW:
    case FhirOperator.OF_TYPE:
      throw new OperationOutcomeError(invalidSearchOperator(filter.operator, param.id ?? param.code));

    default: {
      // Compile-time exhaustiveness check: every operator must be handled above.
      filter.operator satisfies never;
      throw new OperationOutcomeError(invalidSearchOperator(filter.operator, param.id ?? param.code));
    }
  }
}

/** The search operators that token-column search parameters can evaluate. */
export const TokenQueryOperators = [
  FhirOperator.TEXT,
  FhirOperator.CONTAINS,
  FhirOperator.EQUALS,
  FhirOperator.EXACT,
  FhirOperator.NOT,
  FhirOperator.NOT_EQUALS,
] as const;

type TokenQueryOperator = (typeof TokenQueryOperators)[number];

/**
 * Builds one case-insensitive regex condition per comma-separated query value.
 * Negation is NOT handled here; the caller is responsible for negating the
 * disjunction of the returned expressions.
 *
 * The regex is matched against the text produced by the `token_array_to_text` function:
 * the array entries joined by ARRAY_DELIM, with an ARRAY_DELIM prefix and suffix on the
 * whole string.
 *
 * - Dedicated columns: ARRAY_DELIM + <value1> + ARRAY_DELIM + <value2> + ... + ARRAY_DELIM
 * - Shared columns: ARRAY_DELIM + <code1> + DELIM + <value1> + ARRAY_DELIM + ... + ARRAY_DELIM
 *
 * Each pattern is therefore made of:
 * - `ARRAY_DELIM`
 * - `code + DELIM`, only when the search parameter does NOT have dedicated columns
 * - any number of characters other than `ARRAY_DELIM` (to support infix search)
 * - the escaped query string
 * @param impl - The search parameter implementation.
 * @param tableName - The table name.
 * @param code - The search parameter code.
 * @param operator - The search operator.
 * @param filterValue - The query value.
 * @returns The filter expressions for the search parameter without negation.
 */
function buildTokenColumnsWhereConditionTextAndContains(
  impl: TokenColumnSearchParameterImplementation,
  tableName: string,
  code: string,
  operator: TokenQueryOperator,
  filterValue: string
): Expression[] {
  const entryStart = impl.hasDedicatedColumns ? ARRAY_DELIM : ARRAY_DELIM + code + DELIM;

  return splitSearchOnComma(filterValue).map((rawQuery): Expression => {
    const pattern = entryStart + '[^' + ARRAY_DELIM + ']*' + escapeRegexString(rawQuery.trim());
    return new TypedCondition(
      new Column(tableName, impl.textSearchColumnName),
      'TOKEN_ARRAY_IREGEX',
      pattern,
      'TEXT[]'
    );
  });
}

/**
 * Builds a single array-overlap condition covering every comma-separated query value.
 * Negation is NOT handled here; the caller negates the returned expression when needed.
 *
 * Each query value is matched exactly in one of these formats:
 * - `<system>|`
 * - `<system>|<value>`
 * - `|<value>`
 * - `<value>`
 * @param impl - The search parameter implementation.
 * @param tableName - The table name.
 * @param code - The search parameter code.
 * @param operator - The search operator.
 * @param filterValue - The query value.
 * @returns The filter expression for the search parameter without negation.
 */
function buildTokenColumnsWhereConditionEqualsAndExact(
  impl: TokenColumnSearchParameterImplementation,
  tableName: string,
  code: string,
  operator: TokenQueryOperator,
  filterValue: string
): Expression {
  const normalize = (text: string): string => (impl.caseInsensitive ? text.toLocaleLowerCase() : text);

  const hashes = splitSearchOnComma(filterValue).map((rawQuery) => {
    const query = rawQuery.trim();
    const parts = splitN(query, '|', 2);

    let key: string;
    if (parts.length !== 2) {
      // Bare value: matches the value under any system.
      key = DELIM + normalize(query);
    } else {
      // "|foo" searches for "foo" values without a system, aka NULL_SYSTEM.
      // `||` rather than `??` so that an empty string also falls back.
      const system = parts[0] || NULL_SYSTEM;
      const value = parts[1];
      key = value ? system + DELIM + normalize(value) : system;
    }

    return hashTokenColumnValue(impl.hasDedicatedColumns ? key : code + DELIM + key);
  });

  return new Condition(new Column(tableName, impl.tokenColumnName), 'ARRAY_OVERLAPS', hashes, 'UUID[]');
}

/**
 * Escapes regex metacharacters so that a string is matched literally.
 *
 * Escaped characters:
 * - `.` matches any single character except newline
 * - `^` and `$` match the start and end of a string
 * - `*`, `+` and `?` are quantifiers
 * - `(` `)` define capturing groups
 * - `[` `]` define character classes
 * - `{` `}` define quantifiers
 * - `\` escapes a special character
 * - `|` is alternation (OR operator)
 * @param str - The string to escape.
 * @returns The string with each special character preceded by a backslash.
 */
export function escapeRegexString(str: string): string {
  const specialChars = /[.^$*+?()[\]{}\\|]/g;
  return str.replace(specialChars, '\\$&');
}

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/medplum/medplum'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.

token-column.ts•13.2 KiB