ishika_mcp

test_litellm_async.py•4.56 KiB

"""Tests for LiteLLM fallback async completion functionality.""" import pytest import tiktoken from crewai.llm import LLM @pytest.mark.asyncio @pytest.mark.vcr @pytest.mark.skip(reason="cassettes do not read properly but were generated correctly.") async def test_litellm_async_basic_call(): """Test basic async call with LiteLLM fallback.""" llm = LLM(model="gpt-4o-mini", is_litellm=True) result = await llm.acall("Say hello") assert result is not None assert isinstance(result, str) assert len(result) > 0 @pytest.mark.asyncio @pytest.mark.vcr @pytest.mark.skip(reason="cassettes do not read properly but were generated correctly.") async def test_litellm_async_with_temperature(): """Test async call with temperature parameter.""" llm = LLM(model="gpt-4o-mini", is_litellm=True, temperature=0.1) result = await llm.acall("Say the word 'test' once") assert result is not None assert isinstance(result, str) @pytest.mark.asyncio @pytest.mark.vcr @pytest.mark.skip(reason="cassettes do not read properly but were generated correctly.") async def test_litellm_async_with_max_tokens(): """Test async call with max_tokens parameter.""" llm = LLM(model="gpt-4o-mini", is_litellm=True, max_tokens=10) result = await llm.acall("Write a very long story about a dragon.") assert result is not None assert isinstance(result, str) encoder = tiktoken.get_encoding("cl100k_base") token_count = len(encoder.encode(result)) assert token_count <= 10 @pytest.mark.asyncio @pytest.mark.vcr @pytest.mark.skip(reason="cassettes do not read properly but were generated correctly.") async def test_litellm_async_with_system_message(): """Test async call with system message.""" llm = LLM(model="gpt-4o-mini", is_litellm=True) messages = [ {"role": "system", "content": "You are a helpful assistant."}, {"role": "user", "content": "What is 2+2?"}, ] result = await llm.acall(messages) assert result is not None assert isinstance(result, str) @pytest.mark.asyncio @pytest.mark.vcr @pytest.mark.skip(reason="cassettes do not read properly but were generated correctly.") async def test_litellm_async_conversation(): """Test async call with conversation history.""" llm = LLM(model="gpt-4o-mini", is_litellm=True) messages = [ {"role": "user", "content": "My name is Alice."}, {"role": "assistant", "content": "Hello Alice! Nice to meet you."}, {"role": "user", "content": "What is my name?"}, ] result = await llm.acall(messages) assert result is not None assert isinstance(result, str) @pytest.mark.asyncio @pytest.mark.vcr @pytest.mark.skip(reason="cassettes do not read properly but were generated correctly.") async def test_litellm_async_multiple_calls(): """Test making multiple async calls in sequence.""" llm = LLM(model="gpt-4o-mini", is_litellm=True) result1 = await llm.acall("What is 1+1?") result2 = await llm.acall("What is 2+2?") assert result1 is not None assert result2 is not None assert isinstance(result1, str) assert isinstance(result2, str) @pytest.mark.asyncio @pytest.mark.vcr @pytest.mark.skip(reason="cassettes do not read properly but were generated correctly.") async def test_litellm_async_with_parameters(): """Test async call with multiple parameters.""" llm = LLM( model="gpt-4o-mini", is_litellm=True, temperature=0.7, max_tokens=100, top_p=0.9, frequency_penalty=0.5, presence_penalty=0.3, ) result = await llm.acall("Tell me a short fact") assert result is not None assert isinstance(result, str) @pytest.mark.asyncio @pytest.mark.vcr @pytest.mark.skip(reason="cassettes do not read properly but were generated correctly.") async def test_litellm_async_streaming(): """Test async streaming call with LiteLLM fallback.""" llm = LLM(model="gpt-4o-mini", is_litellm=True, stream=True) result = await llm.acall("Say hello world") assert result is not None assert isinstance(result, str) assert len(result) > 0 @pytest.mark.asyncio @pytest.mark.vcr @pytest.mark.skip(reason="cassettes do not read properly but were generated correctly.") async def test_litellm_async_streaming_with_parameters(): """Test async streaming call with multiple parameters.""" llm = LLM( model="gpt-4o-mini", is_litellm=True, stream=True, temperature=0.5, max_tokens=50, ) result = await llm.acall("Count from 1 to 5") assert result is not None assert isinstance(result, str)

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/crewAIInc/crewAI'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

test_litellm_async.py•4.56 KiB