@arizeai/phoenix-mcp

Official

227

7,296

Overview InspectNew Endpoints Schema Related Servers Reviews Score

test_timeseries.py•12.8 kB

from datetime import timedelta
from io import StringIO
from typing import NamedTuple, Union, cast

import numpy as np
import numpy.typing as npt
import pandas as pd
from phoenix.core.model_schema import Column
from phoenix.metrics import Metric
from phoenix.metrics.metrics import (
    CountNotNull,
    EuclideanDistance,
    Mean,
    VectorMean,
    VectorSum,
)
from phoenix.metrics.timeseries import timeseries


def txt2arr(s: str) -> Union[float, npt.NDArray[np.float64]]:
    """Convert one CSV cell into a float or a 1-D float array.

    A cell wrapped in square brackets (e.g. ``"[1 2 3]"``) is split on
    whitespace and returned as a float array. Any other cell is passed to
    ``float``, so ``"nan"`` becomes ``float("nan")``.

    Raises:
        ValueError: if the cell (or a bracketed element) is not a valid float.
    """
    # `startswith`/`endswith` are safe on the empty string, and a one-character
    # string can never satisfy both, so no explicit length check is needed.
    if isinstance(s, str) and s.startswith("[") and s.endswith("]"):
        return np.array(s[1:-1].split(), dtype=float)
    return float(s)


# Reference dataset handed to `EuclideanDistance` below. Its rows are the same
# as the first nine rows of the primary `data` frame used by the tests.
# NOTE(review): `date_parser` is deprecated as of pandas 2.0 (in favor of
# `date_format`); it is kept here so parsing behavior stays unchanged.
reference_data = pd.read_csv(  # type: ignore[call-overload]
    StringIO(
        """
2023-01-01 11:50:52Z,0,839,A,[1 2 3 4 5]
2023-01-01 11:50:53Z,0,nan,A,nan
2023-01-07 00:46:53Z,1,895,B,[2 3 4 5 6]
2023-01-07 00:46:54Z,1,nan,B,nan
2023-01-08 20:22:47Z,2,382,A,[3 4 5 6 7]
2023-01-08 20:22:48Z,2,nan,A,nan
2023-01-10 09:37:54Z,3,276,B,[4 5 6 7 8]
2023-01-10 09:37:55Z,3,nan,B,nan
2023-01-15 11:56:26Z,4,875,A,[5 6 7 8 9]
"""
    ),
    names=["ts", "index", "x", "y", "v"],
    parse_dates=["ts"],
    date_parser=pd.to_datetime,
    index_col="ts",
    converters={"v": txt2arr},
)


class MetricTest(NamedTuple):
    """Pairs a metric with the column name used for it in expected CSVs."""

    name: str
    metric: Metric


metric_tests = (
    MetricTest("Mean(x)", Mean(operand=Column("x"))),
    MetricTest("CountNotNull(x)", CountNotNull(operand=Column("x"))),
    MetricTest("VectorSum(v)", VectorSum(operand=Column("v"), shape=5)),
    MetricTest("VectorMean(v)", VectorMean(operand=Column("v"), shape=5)),
    MetricTest(
        "EuclideanDistance(v)",
        EuclideanDistance(
            operand=Column("v"),
            shape=5,
            reference_data=reference_data,
        ),
    ),
)

# Parallel lists, in `metric_tests` order: column labels and metric objects.
names = [test.name for test in metric_tests]
metrics = [test.metric for test in metric_tests]

start = pd.to_datetime("2023-01-01 11:50:52Z")
stop = pd.to_datetime("2023-01-28 11:26:50Z")  # end instant is exclusive

# The `index` column is added here because it can be a common occurrence in
# dataframes read from csv files, and it will confuse `pandas.DataFrame.query()`
# when
# index filtering is attempted, so it's a good edge case for testing.
data = pd.read_csv(  # type: ignore[call-overload]
    StringIO(
        """
2023-01-01 11:50:52Z,0,839,A,[1 2 3 4 5]
2023-01-01 11:50:53Z,0,nan,A,nan
2023-01-07 00:46:53Z,1,895,B,[2 3 4 5 6]
2023-01-07 00:46:54Z,1,nan,B,nan
2023-01-08 20:22:47Z,2,382,A,[3 4 5 6 7]
2023-01-08 20:22:48Z,2,nan,A,nan
2023-01-10 09:37:54Z,3,276,B,[4 5 6 7 8]
2023-01-10 09:37:55Z,3,nan,B,nan
2023-01-15 11:56:26Z,4,875,A,[5 6 7 8 9]
2023-01-15 11:56:27Z,4,nan,A,nan
2023-01-18 21:13:50Z,5,954,B,[6 7 8 9 10]
2023-01-18 21:13:51Z,5,nan,B,nan
2023-01-21 05:23:50Z,6,750,A,[7 8 9 10 11]
2023-01-21 05:23:51Z,6,nan,A,nan
2023-01-22 00:24:26Z,7,267,B,[8 9 10 11 12]
2023-01-22 00:24:27Z,7,nan,B,nan
2023-01-28 06:52:08Z,8,642,A,[9 10 11 12 13]
2023-01-28 06:52:09Z,8,nan,A,nan
2023-01-28 11:26:50Z,9,446,B,[10 11 12 13 14]
"""
    ),
    names=["ts", "index", "x", "y", "v"],
    parse_dates=["ts"],
    date_parser=pd.to_datetime,
    index_col="ts",
    converters={"v": txt2arr},
)


def _read_expected(csv_text: str) -> pd.DataFrame:
    """Parse an expected-results CSV into a frame indexed by timestamp.

    The columns are ``ts`` followed by one column per entry of ``names``.
    The two vector-valued columns are converted with ``txt2arr``.
    """
    return pd.read_csv(  # type: ignore[call-overload]
        StringIO(csv_text),
        names=["ts"] + names,
        parse_dates=["ts"],
        date_parser=pd.to_datetime,
        index_col="ts",
        converters={"VectorSum(v)": txt2arr, "VectorMean(v)": txt2arr},
    )


def test_timeseries_durational_granularity() -> None:
    """Check results when the evaluation window is longer than the sampling
    interval, and when the sampling interval exceeds the window."""
    # 72-hour window sampled every 24 hours.
    actual = data.pipe(
        timeseries(
            start_time=start,
            end_time=stop,
            evaluation_window=timedelta(hours=72),
            sampling_interval=timedelta(hours=24),
        ),
        metrics=metrics,
    )
    expected = _read_expected(
        """
2023-01-02 11:26:50Z,839.,1,[1. 2. 3. 4. 5.],[1. 2. 3. 4. 5.],4.47214
2023-01-03 11:26:50Z,839.,1,[1. 2. 3. 4. 5.],[1. 2. 3. 4. 5.],4.47214
2023-01-04 11:26:50Z,839.,1,[1. 2. 3. 4. 5.],[1. 2. 3. 4. 5.],4.47214
2023-01-05 11:26:50Z,nan,0,[0. 0. 0. 0. 0.],nan,nan
2023-01-06 11:26:50Z,nan,0,[0. 0. 0. 0. 0.],nan,nan
2023-01-07 11:26:50Z,895.,1,[2. 3. 4. 5. 6.],[2. 3. 4. 5. 6.],2.23607
2023-01-08 11:26:50Z,895.,1,[2. 3. 4. 5. 6.],[2. 3. 4. 5. 6.],2.23607
2023-01-09 11:26:50Z,638.5,2,[5. 7. 9. 11. 13.],[2.5 3.5 4.5 5.5 6.5],1.11803
2023-01-10 11:26:50Z,329.,2,[7. 9. 11. 13. 15.],[3.5 4.5 5.5 6.5 7.5],1.11803
2023-01-11 11:26:50Z,329.,2,[7. 9. 11. 13. 15.],[3.5 4.5 5.5 6.5 7.5],1.11803
2023-01-12 11:26:50Z,276.,1,[4. 5. 6. 7. 8.],[4. 5. 6. 7. 8.],2.23607
2023-01-13 11:26:50Z,nan,0,[0. 0. 0. 0. 0.],nan,nan
2023-01-14 11:26:50Z,nan,0,[0. 0. 0. 0. 0.],nan,nan
2023-01-15 11:26:50Z,nan,0,[0. 0. 0. 0. 0.],nan,nan
2023-01-16 11:26:50Z,875.,1,[5. 6. 7. 8. 9.],[5. 6. 7. 8. 9.],4.47214
2023-01-17 11:26:50Z,875.,1,[5. 6. 7. 8. 9.],[5. 6. 7. 8. 9.],4.47214
2023-01-18 11:26:50Z,875.,1,[5. 6. 7. 8. 9.],[5. 6. 7. 8. 9.],4.47214
2023-01-19 11:26:50Z,954.,1,[6. 7. 8. 9. 10.],[6. 7. 8. 9. 10.],6.70820
2023-01-20 11:26:50Z,954.,1,[6. 7. 8. 9. 10.],[6. 7. 8. 9. 10.],6.70820
2023-01-21 11:26:50Z,852.,2,[13. 15. 17. 19. 21.],[6.5 7.5 8.5 9.5 10.5],7.82624
2023-01-22 11:26:50Z,508.5,2,[15. 17. 19. 21. 23.],[7.5 8.5 9.5 10.5 11.5],10.06231
2023-01-23 11:26:50Z,508.5,2,[15. 17. 19. 21. 23.],[7.5 8.5 9.5 10.5 11.5],10.06231
2023-01-24 11:26:50Z,267.,1,[8. 9. 10. 11. 12.],[8. 9. 10. 11. 12.],11.18034
2023-01-25 11:26:50Z,nan,0,[0. 0. 0. 0. 0.],nan,nan
2023-01-26 11:26:50Z,nan,0,[0. 0. 0. 0. 0.],nan,nan
2023-01-27 11:26:50Z,nan,0,[0. 0. 0. 0. 0.],nan,nan
2023-01-28 11:26:50Z,642.,1,[9. 10. 11. 12. 13.],[9. 10. 11. 12. 13.],13.41641
"""
    )
    compare(expected.round(4), actual.round(4))

    # 72-hour window sampled every 48 hours.
    actual = data.pipe(
        timeseries(
            start_time=start,
            end_time=stop,
            evaluation_window=timedelta(hours=72),
            sampling_interval=timedelta(hours=48),
        ),
        metrics=metrics,
    )
    expected = _read_expected(
        """
2023-01-02 11:26:50Z,839.,1.,[1. 2. 3. 4. 5.],[1. 2. 3. 4. 5.],4.47214
2023-01-04 11:26:50Z,839.,1.,[1. 2. 3. 4. 5.],[1. 2. 3. 4. 5.],4.47214
2023-01-08 11:26:50Z,895.,1.,[2. 3. 4. 5. 6.],[2. 3. 4. 5. 6.],2.23607
2023-01-10 11:26:50Z,329.,2.,[7. 9. 11. 13. 15.],[3.5 4.5 5.5 6.5 7.5],1.11803
2023-01-12 11:26:50Z,276.,1.,[4. 5. 6. 7. 8.],[4. 5. 6. 7. 8.],2.23607
2023-01-16 11:26:50Z,875.,1.,[5. 6. 7. 8. 9.],[5. 6. 7. 8. 9.],4.47214
2023-01-18 11:26:50Z,875.,1.,[5. 6. 7. 8. 9.],[5. 6. 7. 8. 9.],4.47214
2023-01-20 11:26:50Z,954.,1.,[6. 7. 8. 9. 10.],[6. 7. 8. 9. 10.],6.70820
2023-01-22 11:26:50Z,508.5,2.,[15. 17. 19. 21. 23.],[7.5 8.5 9.5 10.5 11.5],10.06231
2023-01-24 11:26:50Z,267.,1.,[8. 9. 10. 11. 12.],[8. 9. 10. 11. 12.],11.18034
2023-01-28 11:26:50Z,642.,1.,[9. 10. 11. 12. 13.],[9. 10. 11. 12. 13.],13.41641
"""
    )
    compare(expected.round(4), actual.round(4))

    # 100-hour window sampled every 99 hours.
    actual = data.pipe(
        timeseries(
            start_time=start,
            end_time=stop,
            evaluation_window=timedelta(hours=100),
            sampling_interval=timedelta(hours=99),
        ),
        metrics=metrics,
    )
    expected = _read_expected(
        """
2023-01-03 17:26:50Z,839.,1,[1. 2. 3. 4. 5.],[1. 2. 3. 4. 5.],4.47214
2023-01-07 20:26:50Z,895.,1,[2. 3. 4. 5. 6.],[2. 3. 4. 5. 6.],2.23607
2023-01-11 23:26:50Z,329.,2,[7. 9. 11. 13. 15.],[3.5 4.5 5.5 6.5 7.5],1.11803
2023-01-16 02:26:50Z,875.,1,[5. 6. 7. 8. 9.],[5. 6. 7. 8. 9.],4.47214
2023-01-20 05:26:50Z,954.,1,[6. 7. 8. 9. 10.],[6. 7. 8. 9. 10.],6.70820
2023-01-24 08:26:50Z,508.5,2,[15. 17. 19. 21. 23.],[7.5 8.5 9.5 10.5 11.5],10.06231
2023-01-28 11:26:50Z,642.,1,[9. 10. 11. 12. 13.],[9. 10. 11. 12. 13.],13.41641
"""
    )
    compare(expected.round(4), actual.round(4))

    # 100-hour window sampled every 396 hours (interval far exceeds window).
    actual = data.pipe(
        timeseries(
            start_time=start,
            end_time=stop,
            evaluation_window=timedelta(hours=100),
            sampling_interval=timedelta(hours=396),
        ),
        metrics=metrics,
    )
    expected = _read_expected(
        """
2023-01-11 23:26:50Z,329.,2,[7. 9. 11. 13. 15.],[3.5 4.5 5.5 6.5 7.5],1.11803
2023-01-28 11:26:50Z,642.,1,[9. 10. 11. 12. 13.],[9. 10. 11. 12. 13.],13.41641
"""
    )
    compare(expected.round(4), actual.round(4))


def test_timeseries_simple_granularity() -> None:
    """Check results when the evaluation window equals the sampling interval."""
    actual = data.pipe(
        timeseries(
            start_time=start,
            end_time=stop,
            evaluation_window=timedelta(hours=80),
            sampling_interval=timedelta(hours=80),
        ),
        metrics=metrics,
    )
    expected = _read_expected(
        """
2023-01-01 19:26:50Z,839.,1,[1. 2. 3. 4. 5.],[1. 2. 3. 4. 5.],4.47214
2023-01-05 03:26:50Z,nan,0,[0. 0. 0. 0. 0.],nan,nan
2023-01-08 11:26:50Z,895.,1,[2. 3. 4. 5. 6.],[2. 3. 4. 5. 6.],2.23607
2023-01-11 19:26:50Z,329.,2,[7. 9. 11. 13. 15.],[3.5 4.5 5.5 6.5 7.5],1.11803
2023-01-15 03:26:50Z,nan,0,[0. 0. 0. 0. 0.],nan,nan
2023-01-18 11:26:50Z,875.,1,[5. 6. 7. 8. 9.],[5. 6. 7. 8. 9.],4.47214
2023-01-21 19:26:50Z,852.,2,[13. 15. 17. 19. 21.],[6.5 7.5 8.5 9.5 10.5],7.82624
2023-01-25 03:26:50Z,267.,1,[8. 9. 10. 11. 12.],[8. 9. 10. 11. 12.],11.18034
2023-01-28 11:26:50Z,642.,1,[9. 10. 11. 12. 13.],[9. 10. 11. 12. 13.],13.41641
"""
    )
    compare(expected.round(4), actual.round(4))


def test_timeseries_all_granularity() -> None:
    """Check results when one window spans the whole ``start``..``stop`` range.

    The expected count is 9: the final row of ``data`` is stamped exactly at
    ``stop``, which is exclusive, so it does not contribute.
    """
    actual = data.pipe(
        timeseries(
            start_time=start,
            end_time=stop,
            evaluation_window=stop - start,
            sampling_interval=stop - start,
        ),
        metrics=metrics,
    )
    expected = _read_expected(
        """
2023-01-28 11:26:50Z,653.3333333333334,9,[45. 54. 63. 72. 81.],[5. 6. 7. 8. 9.],4.472135955
"""
    )
    compare(expected.round(4), actual.round(4))


def test_timeseries_empty_result() -> None:
    """Check that swapping start and end times yields no rows."""
    compare(
        pd.DataFrame(),
        data.pipe(
            timeseries(
                start_time=stop,  # deliberately reversed range
                end_time=start,
                evaluation_window=stop - start,
                sampling_interval=stop - start,
            ),
            metrics=metrics,
        ),
    )


def compare(expected: pd.DataFrame, actual: pd.DataFrame) -> None:
    """Assert that ``actual`` agrees with ``expected`` for every metric.

    Iterates over the rows of ``expected``. When a timestamp is absent from
    ``actual``, each metric is read from an empty mapping instead, and whatever
    ``get_value`` returns for that must still match the expected cell.
    ``actual`` may not contain more rows than ``expected``.

    Raises:
        AssertionError: on a row-count or value mismatch.
    """
    assert len(expected) >= len(actual), (
        f"actual has {len(actual)} rows but at most {len(expected)} were expected"
    )
    for timestamp, row in expected.iterrows():
        # Keep the `try` limited to the lookup that signals a missing timestamp.
        try:
            row_id = cast(int, actual.index.get_loc(timestamp))
        except KeyError:
            result = {}
        else:
            result = actual.iloc[row_id, :].to_dict()
        for test in metric_tests:
            want = row.loc[test.name]
            got = test.metric.get_value(result)
            assert np.allclose(
                want,
                got,
                equal_nan=True,
            ), f"{test.name} at {timestamp}: expected {want!r}, got {got!r}"

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/Arize-ai/phoenix'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.