@arizeai/phoenix-mcp

Official

Overview Schema Related Servers Score Discussions

test_query.py•39.6 KiB

# Tests for `phoenix.trace.dsl.SpanQuery`.
#
# Each test builds a `SpanQuery`, executes it through a database session via
# `session.run_sync`, and compares the resulting DataFrame with a hand-written
# expectation. Row and column order are not part of the contract being tested,
# so most comparisons sort both axes first (see `_assert_frames_match`).

from datetime import datetime
from typing import Any

import pandas as pd
import pytest
from pandas.testing import assert_frame_equal
from sqlalchemy.engine.base import Engine

from phoenix.server.types import DbSessionFactory
from phoenix.trace.dsl import SpanQuery


def _assert_frames_match(
    actual: pd.DataFrame,
    expected: pd.DataFrame,
    **kwargs: Any,
) -> None:
    """Assert two frames are equal after sorting both the index and the columns.

    Args:
        actual: Frame produced by the query under test.
        expected: Hand-written expectation.
        **kwargs: Forwarded unchanged to `assert_frame_equal` (e.g. `check_dtype`).
    """
    assert_frame_equal(
        actual.sort_index().sort_index(axis=1),
        expected.sort_index().sort_index(axis=1),
        **kwargs,
    )


async def _run_query(
    db: DbSessionFactory,
    sq: SpanQuery,
    **kwargs: Any,
) -> pd.DataFrame:
    """Execute `sq` inside a fresh session and return whatever it produces.

    Args:
        db: Session factory fixture.
        sq: Query to execute.
        **kwargs: Forwarded to the query call (e.g. `project_name`, `limit`).
    """
    async with db() as session:
        return await session.run_sync(sq, **kwargs)


async def _xfail_on_postgres(db: DbSessionFactory) -> None:
    """Mark the calling test as an expected failure when the engine URL mentions asyncpg."""
    async with db() as session:
        assert isinstance(engine := session.get_bind(), Engine)
        if "asyncpg" in str(engine.url):
            pytest.xfail("FIX THIS: this test does not currently pass for postgres")


async def test_select_all(
    db: DbSessionFactory,
    abc_project: Any,
) -> None:
    """A bare `SpanQuery()` returns every span of project "abc" with all columns."""
    # i.e. `get_spans_dataframe`
    sq = SpanQuery()
    expected = pd.DataFrame(
        {
            "context.span_id": ["234", "345", "456", "567"],
            "context.trace_id": ["012", "012", "012", "012"],
            "parent_id": ["123", "234", "234", "234"],
            "name": ["root span", "embedding span", "retriever span", "llm span"],
            "span_kind": ["UNKNOWN", "EMBEDDING", "RETRIEVER", "LLM"],
            "status_code": ["OK", "OK", "OK", "ERROR"],
            "status_message": ["okay", "no problemo", "okay", "uh-oh"],
            "start_time": [
                datetime.fromisoformat("2021-01-01T00:00:00.000+00:00"),
                datetime.fromisoformat("2021-01-01T00:00:00.000+00:00"),
                datetime.fromisoformat("2021-01-01T00:00:05.000+00:00"),
                datetime.fromisoformat("2021-01-01T00:00:20.000+00:00"),
            ],
            "end_time": [
                datetime.fromisoformat("2021-01-01T00:00:30.000+00:00"),
                datetime.fromisoformat("2021-01-01T00:00:05.000+00:00"),
                datetime.fromisoformat("2021-01-01T00:00:20.000+00:00"),
                datetime.fromisoformat("2021-01-01T00:00:30.000+00:00"),
            ],
            "attributes.input.value": ["xy%z*", "XY%*Z", "xy%*z", None],
            "attributes.output.value": ["321", None, None, None],
            "attributes.llm.token_count.prompt": [None, None, None, 100.0],
            "attributes.llm.token_count.completion": [None, None, None, 200.0],
            "attributes.metadata": [
                None,
                {"a.b.c": 123, "1.2.3": "abc", "x.y": {"z.a": {"b.c": 321}}},
                None,
                None,
            ],
            "attributes.embedding.model_name": [None, "xyz", None, None],
            "attributes.embedding.embeddings": [
                None,
                [
                    {"embedding.vector": [1, 2, 3], "embedding.text": "123"},
                    {"embedding.vector": [2, 3, 4], "embedding.text": "234"},
                ],
                None,
                None,
            ],
            "attributes.retrieval.documents": [
                None,
                None,
                [
                    {"document.content": "A", "document.score": 1.0},
                    {"document.content": "B", "document.score": 2.0},
                    {"document.content": "C", "document.score": 3.0},
                ],
                None,
            ],
            "attributes.attributes": [None, None, "attributes", {"attributes": "attributes"}],
            "events": [[], [], [], []],
        }
    ).set_index("context.span_id", drop=False)
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_select_all_with_no_data(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Querying project "opq" yields an empty frame that still has the base columns."""
    sq = SpanQuery()
    expected = pd.DataFrame(
        columns=[
            "context.span_id",
            "context.trace_id",
            "parent_id",
            "name",
            "span_kind",
            "status_code",
            "status_message",
            "start_time",
            "end_time",
            "events",
        ]
    ).set_index("context.span_id", drop=False)
    actual = await _run_query(db, sq, project_name="opq")
    _assert_frames_match(actual, expected)


async def test_select(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """`select` accepts positional names and keyword aliases (`tcp=...`)."""
    sq = SpanQuery().select("name", tcp="llm.token_count.prompt")
    expected = pd.DataFrame(
        {
            "context.span_id": ["234", "345", "456", "567"],
            "name": ["root span", "embedding span", "retriever span", "llm span"],
            "tcp": [None, None, None, 100.0],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_select_parent_id_as_span_id(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Aliasing `parent_id` as `span_id` makes the parent ids the index values."""
    sq = SpanQuery().select("name", span_id="parent_id")
    expected = pd.DataFrame(
        {
            "context.span_id": ["123", "234", "234", "234"],
            "name": ["root span", "embedding span", "retriever span", "llm span"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_select_trace_id_as_index(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """`with_index("trace_id")` indexes the result by `context.trace_id`."""
    sq = SpanQuery().select("span_id").with_index("trace_id")
    expected = pd.DataFrame(
        {
            "context.trace_id": ["012", "012", "012", "012"],
            "context.span_id": ["234", "345", "456", "567"],
        }
    ).set_index("context.trace_id")
    actual = await _run_query(db, sq, project_name="abc")
    # Every row shares the same index value, so the rows are additionally
    # ordered by span id before comparing.
    assert_frame_equal(
        actual.sort_index().sort_index(axis=1).sort_values("context.span_id"),
        expected.sort_index().sort_index(axis=1).sort_values("context.span_id"),
    )


async def test_select_nonexistent(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Selecting names absent from the data ("opq", "opq.rst") yields all-None columns."""
    sq = SpanQuery().select("name", "opq", "opq.rst")
    expected = pd.DataFrame(
        {
            "context.span_id": ["234", "345", "456", "567"],
            "name": ["root span", "embedding span", "retriever span", "llm span"],
            "opq": [None, None, None, None],
            "opq.rst": [None, None, None, None],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_default_project(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Without `project_name`, the root-span query returns span "2345".

    NOTE(review): span "2345" presumably comes from the `default_project`
    fixture, which is defined outside this file - confirm.
    """
    sq = SpanQuery().select(
        "name",
        **{"Latency (milliseconds)": "latency_ms"},
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["2345"],
            "name": ["root span"],
            "Latency (milliseconds)": [30000.0],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, root_spans_only=True)
    _assert_frames_match(actual, expected)


async def test_root_spans_only(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """`root_spans_only=True` on project "abc" returns only span "234"."""
    sq = SpanQuery().select(
        "name",
        **{"Latency (milliseconds)": "latency_ms"},
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["234"],
            "name": ["root span"],
            "Latency (milliseconds)": [30000.0],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc", root_spans_only=True)
    _assert_frames_match(actual, expected)


async def test_start_time(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """A `start_time` of 00:00:20 keeps only the span starting at that instant."""
    sq = SpanQuery().select("name")
    expected = pd.DataFrame(
        {
            "context.span_id": ["567"],
            "name": ["llm span"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(
        db,
        sq,
        project_name="abc",
        start_time=datetime.fromisoformat(
            "2021-01-01T00:00:20.000+00:00",
        ),
    )
    _assert_frames_match(actual, expected)


async def test_end_time(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """An `end_time` of 00:00:01 keeps only the two spans that start at 00:00:00."""
    sq = SpanQuery().select("name")
    expected = pd.DataFrame(
        {
            "context.span_id": ["234", "345"],
            "name": ["root span", "embedding span"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(
        db,
        sq,
        project_name="abc",
        end_time=datetime.fromisoformat(
            "2021-01-01T00:00:01.000+00:00",
        ),
    )
    _assert_frames_match(actual, expected)


async def test_limit(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """`limit=2` on a bare query returns spans "567" and "456", in that order."""
    sq = SpanQuery()
    actual = await _run_query(db, sq, project_name="abc", limit=2)
    # Newest-first ordering
    assert actual.index.tolist() == ["567", "456"]


async def test_limit_with_select_statement(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """`limit=2` combined with an explicit `select` returns spans "234" and "345"."""
    sq = SpanQuery().select("context.span_id")
    expected = pd.DataFrame(
        {
            "context.span_id": ["234", "345"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc", limit=2)
    _assert_frames_match(actual, expected)


async def test_filter_for_none(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """`parent_id is None` matches nothing in project "abc"."""
    sq = (
        SpanQuery()
        .select("name")
        .where(
            "parent_id is None",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": [],
            "name": [],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    # The type checks are switched off for this empty-frame comparison.
    _assert_frames_match(
        actual,
        expected,
        check_dtype=False,
        check_column_type=False,
        check_frame_type=False,
        check_index_type=False,
    )


async def test_filter_for_not_none(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """`output.value is not None` matches only span "234"."""
    sq = (
        SpanQuery()
        .select("name")
        .where(
            "output.value is not None",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["234"],
            "name": ["root span"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_for_substring_case_sensitive_not_glob_not_like(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """`in` is a literal, case-sensitive substring test: `%` and `*` are not wildcards."""
    sq = (
        SpanQuery()
        .select("input.value")
        .where(
            "'y%*' in input.value",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["456"],
            "input.value": ["xy%*z"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_for_not_substring_case_sensitive_not_glob_not_like(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """`not in` is the literal, case-sensitive negation; the None-valued span is excluded."""
    sq = (
        SpanQuery()
        .select("input.value")
        .where(
            "'y%*' not in input.value",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["234", "345"],
            "input.value": ["xy%z*", "XY%*Z"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_on_nonexistent_is_not_none(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """`is not None` on names absent from the data matches no spans."""
    sq = (
        SpanQuery()
        .select("name")
        .where(
            "opq is not None or opq.rst is not None",
        )
    )
    expected = pd.DataFrame(
        columns=["context.span_id", "name"],
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_on_nonexistent_is_none(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """`is None` on names absent from the data matches every span."""
    sq = (
        SpanQuery()
        .select("name")
        .where(
            "opq is None or opq.rst is None",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["234", "345", "456", "567"],
            "name": ["root span", "embedding span", "retriever span", "llm span"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_on_latency(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """A chained comparison on `latency_ms` selects the single 10-second span."""
    sq = (
        SpanQuery()
        .select(
            "name",
            **{"Latency (milliseconds)": "latency_ms"},
        )
        .where("9_000 < latency_ms < 11_000")
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["567"],
            "name": ["llm span"],
            "Latency (milliseconds)": [10000.0],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_on_cumulative_token_count(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """`cumulative_token_count.total` can be range-filtered alongside an attribute test."""
    sq = (
        SpanQuery()
        .select("name")
        .where("290 < cumulative_token_count.total < 310 and llm.token_count.prompt is None")
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["234"],
            "name": ["root span"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_on_metadata_with_arithmetic(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """A metadata value can take part in arithmetic inside a filter (12 - 123 == -111)."""
    sq = (
        SpanQuery()
        .select("metadata['a.b.c']")
        .where(
            "12 - metadata['a.b.c'] == -111",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["345"],
            "metadata['a.b.c']": [123],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_on_metadata_cast_as_int(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Same arithmetic filter, with the metadata value wrapped in an explicit `int(...)`."""
    sq = (
        SpanQuery()
        .select("metadata['a.b.c']")
        .where(
            "12 - int(metadata['a.b.c']) == -111",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["345"],
            "metadata['a.b.c']": [123],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_on_metadata_substring_search(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Substring search (`in`) works on a metadata value."""
    sq = (
        SpanQuery()
        .select("metadata['1.2.3']")
        .where(
            "'b' in metadata['1.2.3']",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["345"],
            "metadata['1.2.3']": ["abc"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_on_metadata_cast_as_str(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Same substring filter, with the metadata value wrapped in an explicit `str(...)`."""
    sq = (
        SpanQuery()
        .select("metadata['1.2.3']")
        .where(
            "'b' in str(metadata['1.2.3'])",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["345"],
            "metadata['1.2.3']": ["abc"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_on_metadata_using_subscript_key(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Equality filter on `metadata[...]` with a single string key containing dots."""
    sq = (
        SpanQuery()
        .select("metadata['1.2.3']")
        .where(
            "metadata['1.2.3'] == 'abc'",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["345"],
            "metadata['1.2.3']": ["abc"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_on_metadata_using_subscript_keys_list_with_single_key(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """A one-element key list (`metadata[['1.2.3']]`) gives the same match as the plain key."""
    sq = (
        SpanQuery()
        .select("metadata[['1.2.3']]")
        .where(
            "metadata[['1.2.3']] == 'abc'",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["345"],
            "metadata[['1.2.3']]": ["abc"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_on_metadata_using_subscript_keys_list_with_multiple_keys(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """A multi-element key list walks nested metadata one key per level."""
    sq = (
        SpanQuery()
        .select("metadata[['x.y', 'z.a']]")
        .where(
            "metadata[['x.y', 'z.a', 'b.c']] == 321",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["345"],
            "metadata[['x.y', 'z.a']]": [{"b.c": 321}],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_on_attribute_using_subscript_key(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """`attributes['attributes']` addresses an attribute that is itself named "attributes"."""
    sq = (
        SpanQuery()
        .select("attributes['attributes']")
        .where(
            "attributes['attributes'] == 'attributes'",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["456"],
            "attributes['attributes']": ["attributes"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_on_attribute_using_subscript_keys_list_with_single_key(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """A one-element key list on `attributes` gives the same match as the plain key."""
    sq = (
        SpanQuery()
        .select("attributes[['attributes']]")
        .where(
            "attributes[['attributes']] == 'attributes'",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["456"],
            "attributes[['attributes']]": ["attributes"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_on_attribute_using_subscript_keys_list_with_multiple_keys(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """A two-element key list on `attributes` reaches the nested "attributes" value."""
    sq = (
        SpanQuery()
        .select("attributes[['attributes', 'attributes']]")
        .where(
            "attributes[['attributes', 'attributes']] == 'attributes'",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["567"],
            "attributes[['attributes', 'attributes']]": ["attributes"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_on_span_id_single(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Equality filter on `span_id`."""
    sq = (
        SpanQuery()
        .select("embedding.model_name")
        .where(
            "span_id == '345'",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["345"],
            "embedding.model_name": ["xyz"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_on_span_id_multiple(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Membership filter on `span_id` using a list literal."""
    sq = (
        SpanQuery()
        .select("embedding.model_name")
        .where(
            "span_id in ['345', '567']",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["345", "567"],
            "embedding.model_name": ["xyz", None],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_on_trace_id_single(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Equality filter on `trace_id`."""
    sq = (
        SpanQuery()
        .select("trace_id")
        .where(
            "trace_id == '012'",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["234", "345", "456", "567"],
            "context.trace_id": ["012", "012", "012", "012"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_filter_on_trace_id_multiple(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Membership filter on `trace_id` using a tuple literal."""
    sq = (
        SpanQuery()
        .select("trace_id")
        .where(
            "trace_id in ('012',)",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["234", "345", "456", "567"],
            "context.trace_id": ["012", "012", "012", "012"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


@pytest.mark.parametrize(
    "condition,expected",
    [
        ["evals['0'].score is not None", ["345", "456"]],
        ["evals['0'].score is None", ["234", "567"]],
        ["evals['0'].score == 0", ["345"]],
        ["evals['0'].score != 0", ["456"]],
        ["evals['0'].score != 0 or evals['0'].score is None", ["234", "456", "567"]],
        ["evals['1'].label is not None", ["456", "567"]],
        ["evals['1'].label is None", ["234", "345"]],
        ["evals['1'].label == '1'", ["456"]],
        ["evals['1'].label != '1'", ["567"]],
        ["evals['1'].label != '1' or evals['1'].label is None", ["234", "345", "567"]],
        ["evals['0'].score is not None or evals['1'].label is not None", ["345", "456", "567"]],
        ["evals['0'].score is None or evals['1'].label is None", ["234", "345", "567"]],
        ["evals['0'].score == 0 or evals['1'].label == '1'", ["345", "456"]],
        ["evals['0'].score != 0 or evals['1'].label != '1'", ["456", "567"]],
        ["evals['0'].score is not None or evals['1'].label is None", ["234", "345", "456"]],
        ["evals['0'].score is None or evals['1'].label is not None", ["234", "456", "567"]],
        ["evals['0'].score == 0 or evals['1'].label != '1'", ["345", "567"]],
        ["evals['0'].score != 0 or evals['1'].label == '1'", ["456"]],
        [
            "evals['0']",
            ["345", "456"],
        ],
        [
            "annotations['0']",
            ["345", "456"],
        ],
        [
            "evals['1']",
            ["456", "567"],
        ],
        [
            "annotations['1']",
            ["456", "567"],
        ],
    ],
)
async def test_filter_on_span_annotation(
    db: DbSessionFactory,
    abc_project: Any,
    condition: str,
    expected: list[str],
) -> None:
    """Each `evals[...]` / `annotations[...]` condition selects the listed span ids."""
    sq = SpanQuery().select("span_id").where(condition)
    actual = await _run_query(db, sq, project_name="abc")
    assert sorted(actual.index) == expected


async def test_explode_embeddings_no_select(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Exploding embeddings with no kwargs yields one row per item, indexed by `position`."""
    sq = SpanQuery().explode("embedding.embeddings")
    expected = pd.DataFrame(
        {
            "context.span_id": ["345", "345"],
            "position": [0, 1],
            "embedding.text": ["123", "234"],
            "embedding.vector": [[1, 2, 3], [2, 3, 4]],
        }
    ).set_index(["context.span_id", "position"])
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_explode_embeddings_with_select_and_no_kwargs(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Selected columns are repeated on every exploded embedding row."""
    sq = (
        SpanQuery()
        .select("embedding.model_name")
        .explode(
            "embedding.embeddings",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["345", "345"],
            "position": [0, 1],
            "embedding.model_name": ["xyz", "xyz"],
            "embedding.text": ["123", "234"],
            "embedding.vector": [[1, 2, 3], [2, 3, 4]],
        }
    ).set_index(["context.span_id", "position"])
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_explode_documents_no_select(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Exploding documents with kwargs renames fields and indexes by `document_position`."""
    sq = SpanQuery().explode(
        "retrieval.documents",
        content="document.content",
        score="document.score",
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["456", "456", "456"],
            "document_position": [0, 1, 2],
            "content": ["A", "B", "C"],
            "score": [1, 2, 3],
        }
    ).set_index(["context.span_id", "document_position"])
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_explode_documents_with_select_and_non_ascii_kwargs(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Explode aliases may be non-ASCII column names."""
    sq = (
        SpanQuery()
        .select("trace_id")
        .explode(
            "retrieval.documents",
            **{
                "콘텐츠": "document.content",
                "スコア": "document.score",
            },
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["456", "456", "456"],
            "document_position": [0, 1, 2],
            "context.trace_id": ["012", "012", "012"],
            "콘텐츠": ["A", "B", "C"],
            "スコア": [1, 2, 3],
        }
    ).set_index(["context.span_id", "document_position"])
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_concat_documents_no_select(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Concatenating document contents joins them with a blank line between items."""
    sq = SpanQuery().concat(
        "retrieval.documents",
        content="document.content",
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["456"],
            "content": ["A\n\nB\n\nC"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_concat_documents_no_select_but_no_data(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Concat against project "opq" yields an empty frame with the alias column."""
    sq = SpanQuery().concat(
        "retrieval.documents",
        content="document.content",
    )
    expected = pd.DataFrame(
        columns=["context.span_id", "content"],
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="opq")
    _assert_frames_match(actual, expected)


async def test_concat_documents_with_select(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Selected columns appear alongside the concatenated column."""
    sq = (
        SpanQuery()
        .select("trace_id")
        .concat(
            "retrieval.documents",
            content="document.content",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["456"],
            "context.trace_id": ["012"],
            "content": ["A\n\nB\n\nC"],
        }
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_concat_documents_with_select_but_no_data(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Select + concat against project "opq" yields an empty frame with both columns."""
    sq = (
        SpanQuery()
        .select("trace_id")
        .concat(
            "retrieval.documents",
            content="document.content",
        )
    )
    expected = pd.DataFrame(
        columns=["context.span_id", "content", "context.trace_id"],
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="opq")
    _assert_frames_match(actual, expected)


async def test_concat_documents_with_select_but_with_typo_in_array_name(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Concat on a misspelled array ("retriever.documents") yields an empty frame."""
    sq = (
        SpanQuery()
        .select("trace_id")
        .concat(
            "retriever.documents",
            content="document.content",
        )
    )
    expected = pd.DataFrame(
        columns=["context.span_id", "content", "context.trace_id"],
    ).set_index("context.span_id")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_concat_documents_with_select_and_non_default_separator(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """`with_concat_separator(",")` replaces the default separator; index is `name`."""
    sq = (
        SpanQuery()
        .with_index("name")
        .with_concat_separator(",")
        .concat(
            "embedding.embeddings",
            text="embedding.text",
        )
    )
    expected = pd.DataFrame(
        {
            "name": ["embedding span"],
            "text": ["123,234"],
        }
    ).set_index("name")
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_explode_and_concat_on_same_array(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Concat and explode on one array: the joined text repeats on each exploded row."""
    sq = (
        SpanQuery()
        .concat(
            "retrieval.documents",
            content="document.content",
        )
        .explode(
            "retrieval.documents",
            score="document.score",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["456", "456", "456"],
            "document_position": [0, 1, 2],
            "content": ["A\n\nB\n\nC", "A\n\nB\n\nC", "A\n\nB\n\nC"],
            "score": [1, 2, 3],
        }
    ).set_index(["context.span_id", "document_position"])
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_explode_and_concat_on_same_array_but_no_data(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Concat + explode against project "opq" yields an empty, doubly-indexed frame."""
    sq = (
        SpanQuery()
        .concat(
            "retrieval.documents",
            content="document.content",
        )
        .explode(
            "retrieval.documents",
            score="document.score",
        )
    )
    expected = pd.DataFrame(
        columns=[
            "context.span_id",
            "document_position",
            "content",
            "score",
        ]
    ).set_index(["context.span_id", "document_position"])
    actual = await _run_query(db, sq, project_name="opq")
    _assert_frames_match(actual, expected)


async def test_explode_and_concat_on_same_array_with_same_label(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """When concat and explode share the alias "content", the concatenated value is expected."""
    await _xfail_on_postgres(db)
    sq = (
        SpanQuery()
        .concat(
            "retrieval.documents",
            content="document.content",
        )
        .explode(
            "retrieval.documents",
            content="document.content",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["456", "456", "456"],
            "document_position": [0, 1, 2],
            "content": ["A\n\nB\n\nC", "A\n\nB\n\nC", "A\n\nB\n\nC"],
        }
    ).set_index(["context.span_id", "document_position"])
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_explode_and_concat_on_same_array_but_with_typo_in_concat_array_name(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """A misspelled concat array leaves `content` as None on every exploded row."""
    sq = (
        SpanQuery()
        .concat(
            "retriever.documents",
            content="document.content",
        )
        .explode(
            "retrieval.documents",
            score="document.score",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["456", "456", "456"],
            "document_position": [0, 1, 2],
            "content": [None, None, None],
            "score": [1, 2, 3],
        }
    ).set_index(["context.span_id", "document_position"])
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_explode_and_concat_on_same_array_but_with_typo_in_explode_array_name(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """A misspelled explode array leaves only the concat result, indexed by span id."""
    await _xfail_on_postgres(db)
    sq = (
        SpanQuery()
        .concat(
            "retrieval.documents",
            content="document.content",
        )
        .explode(
            "retriever.documents",
            score="document.score",
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["456"],
            "content": ["A\n\nB\n\nC"],
        }
    ).set_index(["context.span_id"])
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)


async def test_explode_and_concat_on_same_array_with_non_ascii_kwargs(
    db: DbSessionFactory,
    default_project: Any,
    abc_project: Any,
) -> None:
    """Select + concat + explode together, with non-ASCII aliases for both operations."""
    sq = (
        SpanQuery()
        .select("name")
        .concat(
            "retrieval.documents",
            **{"콘텐츠": "document.content"},
        )
        .explode(
            "retrieval.documents",
            **{"スコア": "document.score"},
        )
    )
    expected = pd.DataFrame(
        {
            "context.span_id": ["456", "456", "456"],
            "document_position": [0, 1, 2],
            "name": ["retriever span", "retriever span", "retriever span"],
            "콘텐츠": ["A\n\nB\n\nC", "A\n\nB\n\nC", "A\n\nB\n\nC"],
            "スコア": [1, 2, 3],
        }
    ).set_index(["context.span_id", "document_position"])
    actual = await _run_query(db, sq, project_name="abc")
    _assert_frames_match(actual, expected)

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/Arize-ai/phoenix'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.

test_query.py•39.6 KiB