testonnx.py
""" ONNX module tests """ import os import tempfile import unittest from unittest.mock import patch from sklearn.feature_extraction.text import TfidfVectorizer from sklearn.linear_model import LogisticRegression from sklearn.pipeline import Pipeline from txtai.embeddings import Embeddings from txtai.models import OnnxModel from txtai.pipeline import HFOnnx, HFTrainer, Labels, MLOnnx, Questions class TestOnnx(unittest.TestCase): """ ONNX tests. """ @classmethod def setUpClass(cls): """ Create default datasets. """ cls.data = [{"text": "Dogs", "label": 0}, {"text": "dog", "label": 0}, {"text": "Cats", "label": 1}, {"text": "cat", "label": 1}] * 100 def testDefault(self): """ Test exporting an ONNX model with default parameters """ # Export model to ONNX, use default parameters onnx = HFOnnx() model = onnx("google/bert_uncased_L-2_H-128_A-2") # Validate model has data self.assertGreater(len(model), 0) # Validate model device properly works self.assertEqual(OnnxModel(model).device, -1) def testClassification(self): """ Test exporting a classification model to ONNX and running inference """ path = "google/bert_uncased_L-2_H-128_A-2" trainer = HFTrainer() model, tokenizer = trainer(path, self.data) # Output file path output = os.path.join(tempfile.gettempdir(), "onnx") # Export model to ONNX onnx = HFOnnx() model = onnx((model, tokenizer), "text-classification", output, True) # Test classification labels = Labels((model, path), dynamic=False) self.assertEqual(labels("cat")[0][0], 1) @patch("onnxruntime.get_available_providers") @patch("torch.cuda.is_available") def testPooling(self, cuda, providers): """ Test exporting a pooling model to ONNX and running inference """ path = "sentence-transformers/paraphrase-MiniLM-L3-v2" # Export model to ONNX onnx = HFOnnx() model = onnx(path, "pooling", quantize=True) # Test no CUDA and onnxruntime installed cuda.return_value = False providers.return_value = ["CPUExecutionProvider"] embeddings = Embeddings({"path": model, "tokenizer": path}) self.assertEqual(embeddings.similarity("animal", ["dog", "book", "rug"])[0][0], 0) # Test no CUDA and onnxruntime-gpu installed cuda.return_value = False providers.return_value = ["CUDAExecutionProvider", "CPUExecutionProvider"] embeddings = Embeddings({"path": model, "tokenizer": path}) self.assertIsNotNone(embeddings) # Test CUDA and only onnxruntime installed cuda.return_value = True providers.return_value = ["CPUExecutionProvider"] embeddings = Embeddings({"path": model, "tokenizer": path}) self.assertIsNotNone(embeddings) # Test CUDA and onnxruntime-gpu installed cuda.return_value = True providers.return_value = ["CUDAExecutionProvider", "CPUExecutionProvider"] embeddings = Embeddings({"path": model, "tokenizer": path}) self.assertIsNotNone(embeddings) def testQA(self): """ Test exporting a QA model to ONNX and running inference """ path = "distilbert-base-cased-distilled-squad" # Export model to ONNX onnx = HFOnnx() model = onnx(path, "question-answering") questions = Questions((model, path)) self.assertEqual(questions(["What is the price?"], ["The price is $30"])[0], "$30") def testScikit(self): """ Test exporting a scikit-learn model to ONNX and running inference """ # pylint: disable=W0613 def tokenizer(inputs, **kwargs): if isinstance(inputs, str): inputs = [inputs] return {"input_ids": [[x] for x in inputs]} # Train a scikit-learn model model = Pipeline([("tfidf", TfidfVectorizer()), ("lr", LogisticRegression())]) model.fit([x["text"] for x in self.data], [x["label"] for x in self.data]) # Export model to ONNX 
onnx = MLOnnx() model = onnx(model) # Test classification labels = Labels((model, tokenizer), dynamic=False) self.assertEqual(labels("cat")[0][0], 1) def testZeroShot(self): """ Test exporting a zero shot classification model to ONNX and running inference """ path = "prajjwal1/bert-medium-mnli" # Export model to ONNX onnx = HFOnnx() model = onnx(path, "zero-shot-classification", quantize=True) # Test zero shot classification labels = Labels((model, path)) self.assertEqual(labels("That is great news", ["negative", "positive"])[0][0], 1)
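A minimal sketch for running this suite outside of test discovery, using only the standard library runner. It assumes the file above is saved as testonnx.py on the Python path and that txtai's optional ONNX dependencies are installed; neither the module name nor the runner code is part of the original file.

import unittest

# Assumes testonnx.py is importable from the current directory
from testonnx import TestOnnx

# Build a suite from the TestOnnx case and run it with verbose output
suite = unittest.defaultTestLoader.loadTestsFromTestCase(TestOnnx)
unittest.TextTestRunner(verbosity=2).run(suite)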
