Browser Use Heroku

test_agent_multiprocessing.py•14.3 KiB

"""
Tests for parallelism and event loop handling in browser-use.

Tests cover:
1. One event loop with asyncio.run and one task
2. One event loop with two different parallel agents
3. One event loop with two different sequential agents
4. Two event loops, with one agent per loop sequential
5. Two event loops, one per thread, with one agent in each loop
6. Two subprocesses, with one agent per subprocess
7. Failing test to catch asyncio.run() RuntimeError issue

NOTE(review): no test for item 7 is defined in this module as shown, and the
test for item 4 runs both agents on the current event loop rather than
creating new loops - confirm whether the list above should be trimmed.
"""

import asyncio
import logging
import multiprocessing
from concurrent.futures import ThreadPoolExecutor

import pytest

from browser_use import Agent, setup_logging
from browser_use.browser import BrowserProfile, BrowserSession
from tests.ci.conftest import create_mock_llm

# Set up test logging
setup_logging()
logger = logging.getLogger(__name__)


def _has_done_action(history_item):
    """Return True if any action of ``history_item.model_output`` dumps a 'done' key.

    The caller must have checked that ``history_item.model_output.action`` is set.
    """
    return any('done' in action.model_dump(include={'done'}) for action in history_item.model_output.action)


def _assert_finished_with_done(result):
    """Assert that ``result`` has history and that its last step ended with 'done'.

    The 'done' check is only applied when the last history entry carries a
    model output with actions; otherwise only the non-empty history is asserted.
    """
    assert len(result.history) > 0
    last_history = result.history[-1]
    if last_history.model_output and last_history.model_output.action:
        assert _has_done_action(last_history)


def _shutdown_event_loop(loop):
    """Best-effort teardown of a non-running event loop created by a test.

    Lets already-scheduled tasks run briefly, cancels whatever is still
    pending, then stops and closes the loop. Errors raised while draining or
    cancelling are logged at debug level and otherwise ignored, so teardown
    never hides the outcome of the test itself.
    """
    # Give asyncio tasks a moment to complete
    try:
        loop.run_until_complete(asyncio.sleep(0.1))
    except Exception:
        logger.debug('Ignoring error while draining event loop', exc_info=True)

    # Cancel all pending tasks
    try:
        pending = asyncio.all_tasks(loop)
        for task in pending:
            task.cancel()
        if pending:
            loop.run_until_complete(asyncio.gather(*pending, return_exceptions=True))
    except Exception:
        logger.debug('Ignoring error while cancelling pending tasks', exc_info=True)

    loop.stop()
    loop.close()


def run_agent_in_subprocess_module(task_description):
    """Module-level function to run an agent in a subprocess.

    Defined at module level so ``multiprocessing.Pool`` can pickle it by
    reference.

    Args:
        task_description: Task text handed to the ``Agent``.

    Returns:
        A plain dict ``{'success': bool, 'error': str | None}``. ``success`` is
        True only when the last history entry contains a 'done' action;
        ``error`` holds ``str(exception)`` if running the agent raised.
    """
    # Create new event loop for this process
    loop = asyncio.new_event_loop()
    asyncio.set_event_loop(loop)

    async def run_agent():
        # Create mock LLM inline to avoid pickling issues
        mock_llm = create_mock_llm()

        agent = Agent(
            task=task_description,
            llm=mock_llm,
            enable_memory=False,
            browser_profile=BrowserProfile(headless=True, user_data_dir=None),
        )
        return await agent.run()

    try:
        result = loop.run_until_complete(run_agent())
        has_done = False
        if len(result.history) > 0:
            last_history = result.history[-1]
            if last_history.model_output and last_history.model_output.action:
                has_done = _has_done_action(last_history)
        return {'success': has_done, 'error': None}
    except Exception as e:
        return {'success': False, 'error': str(e)}
    finally:
        _shutdown_event_loop(loop)


class TestParallelism:
    """Test parallelism and event loop handling"""

    async def test_one_event_loop_with_asyncio_run_and_one_task(self):
        """Test one event loop with asyncio.run and one task"""
        logger.info('Testing one event loop with asyncio.run and one task')

        # Create mock LLM
        mock_llm = create_mock_llm()

        # Just run directly in the current event loop
        agent = Agent(
            task='Test task',
            llm=mock_llm,
            enable_memory=False,
            browser_profile=BrowserProfile(headless=True, user_data_dir=None),
        )
        result = await agent.run()

        # Verify the agent completed successfully and the last action was 'done'
        assert result is not None
        _assert_finished_with_done(result)

    @pytest.mark.skip('TODO: fix this')
    async def test_one_event_loop_two_parallel_agents(self):
        """Test one event loop with two different parallel agents"""
        logger.info('Testing one event loop with two parallel agents')

        # Create mock LLM
        mock_llm = create_mock_llm()

        # Create a shared browser session
        browser_session = BrowserSession(
            browser_profile=BrowserProfile(
                headless=True,
                user_data_dir=None,  # Use temp directory
                keep_alive=True,
            )
        )

        try:
            await browser_session.start()

            # Create two agents that will run in parallel
            agent1 = Agent(
                task='First parallel task',
                llm=mock_llm,
                browser_session=browser_session,
                enable_memory=False,
            )
            agent2 = Agent(
                task='Second parallel task',
                llm=mock_llm,
                browser_session=browser_session,
                enable_memory=False,
            )

            # Run both agents in parallel on the same event loop
            results = await asyncio.gather(agent1.run(), agent2.run())

            # Verify both agents completed successfully
            assert len(results) == 2
            for result in results:
                _assert_finished_with_done(result)

            # Verify they share the same browser session (new behavior)
            assert agent1.browser_session is agent2.browser_session
            assert agent1.browser_session is browser_session
        finally:
            await browser_session.kill()

    @pytest.mark.skip('TODO: fix this')
    async def test_one_event_loop_two_sequential_agents(self):
        """Test one event loop with two different sequential agents"""
        logger.info('Testing one event loop with two sequential agents')

        # Create mock LLM
        mock_llm = create_mock_llm()

        # Create a shared browser session
        browser_session = BrowserSession(
            browser_profile=BrowserProfile(
                headless=True,
                user_data_dir=None,  # Use temp directory
                keep_alive=True,
            )
        )

        try:
            await browser_session.start()

            # First agent
            agent1 = Agent(
                task='First sequential task',
                llm=mock_llm,
                browser_session=browser_session,
                enable_memory=False,
            )
            result1 = await agent1.run()

            # Second agent (runs after first completes)
            agent2 = Agent(
                task='Second sequential task',
                llm=mock_llm,
                browser_session=browser_session,
                enable_memory=False,
            )
            result2 = await agent2.run()

            # Verify both agents completed successfully
            for result in [result1, result2]:
                _assert_finished_with_done(result)

            # Verify they share the same browser session (new behavior)
            assert agent1.browser_session is agent2.browser_session
            assert agent1.browser_session is browser_session
        finally:
            await browser_session.kill()

    async def test_two_event_loops_sequential(self):
        """Test two event loops, with one agent per loop sequential"""
        logger.info('Testing two event loops with one agent per loop sequential')

        # Create mock LLM
        mock_llm = create_mock_llm()

        # Just run agents sequentially in the same event loop
        # This still tests sequential execution without creating new loops
        agent1 = Agent(
            task='First loop task',
            llm=mock_llm,
            enable_memory=False,
            browser_profile=BrowserProfile(headless=True, user_data_dir=None),
        )
        result1 = await agent1.run()

        agent2 = Agent(
            task='Second loop task',
            llm=mock_llm,
            enable_memory=False,
            browser_profile=BrowserProfile(headless=True, user_data_dir=None),
        )
        result2 = await agent2.run()

        # Verify both agents completed successfully
        for result in [result1, result2]:
            _assert_finished_with_done(result)

    async def test_two_event_loops_one_per_thread(self):
        """Test two event loops, one per thread, with one agent in each loop"""
        logger.info('Testing two event loops, one per thread')

        # Create mock LLM
        mock_llm = create_mock_llm()

        results = {}
        errors = {}

        def run_agent_in_thread(thread_name, task_description):
            """Run an agent in a new thread with its own event loop"""
            # Create the loop before entering try/finally so the cleanup path
            # never references an unbound name if loop creation itself fails.
            thread_loop = asyncio.new_event_loop()
            try:
                asyncio.set_event_loop(thread_loop)

                async def run_agent():
                    agent = Agent(
                        task=task_description,
                        llm=mock_llm,
                        enable_memory=False,
                        browser_profile=BrowserProfile(headless=True, user_data_dir=None),
                    )
                    return await agent.run()

                # Run the agent in this thread's event loop
                result = thread_loop.run_until_complete(run_agent())
                results[thread_name] = result
            except Exception as e:
                errors[thread_name] = e
            finally:
                _shutdown_event_loop(thread_loop)

        # Use run_in_executor to run threads; we are inside a coroutine, so the
        # running loop is the one to schedule on.
        running_loop = asyncio.get_running_loop()
        with ThreadPoolExecutor(max_workers=2) as executor:
            future1 = running_loop.run_in_executor(executor, run_agent_in_thread, 'thread1', 'Thread 1 task')
            future2 = running_loop.run_in_executor(executor, run_agent_in_thread, 'thread2', 'Thread 2 task')

            # Wait for both to complete
            await asyncio.gather(future1, future2)

        # Check for errors
        assert len(errors) == 0, f'Errors occurred: {errors}'

        # Verify both agents completed successfully
        assert len(results) == 2
        for result in results.values():
            _assert_finished_with_done(result)

    def test_two_subprocesses_one_agent_per_subprocess(self):
        """Test two subprocesses, with one agent per subprocess"""
        logger.info('Testing two subprocesses with one agent per subprocess')

        # Use multiprocessing to run agents in separate processes
        with multiprocessing.Pool(processes=2) as pool:
            tasks = ['Subprocess 1 task', 'Subprocess 2 task']
            results = pool.map(run_agent_in_subprocess_module, tasks)

        # Verify both agents completed successfully
        assert len(results) == 2
        for i, result in enumerate(results):
            assert result['error'] is None, f'Process {i} error: {result["error"]}'
            assert result['success'] is True

    @pytest.mark.skip('TODO: fix this')
    async def test_shared_browser_session_multiple_tabs(self):
        """Test multiple agents sharing same browser session with different tabs"""
        logger.info('Testing shared browser session with multiple tabs')

        # Create action sequences - each agent creates a new tab
        tab_action = """
        {
            "thinking": "null",
            "evaluation_previous_goal": "Starting task",
            "memory": "Need new tab",
            "next_goal": "Create new tab",
            "action": [
                {
                    "go_to_url": {
                        "url": "https://example.com",
                        "new_tab": true
                    }
                }
            ]
        }
        """

        done_action = """
        {
            "thinking": "null",
            "evaluation_previous_goal": "Tab created",
            "memory": "Task done",
            "next_goal": "Complete",
            "action": [
                {
                    "done": {
                        "text": "Task completed",
                        "success": true
                    }
                }
            ]
        }
        """

        # Create mocks with tab creation actions
        mock_llm1 = create_mock_llm([tab_action, done_action])
        mock_llm2 = create_mock_llm([tab_action, done_action])

        # Create shared browser session
        shared_session = BrowserSession(
            browser_profile=BrowserProfile(
                headless=True,
                user_data_dir=None,
                keep_alive=True,
            )
        )

        try:
            await shared_session.start()

            # Create agents sharing the session
            agent1 = Agent(
                task='Task in tab 1',
                llm=mock_llm1,
                browser_session=shared_session,
                enable_memory=False,
            )
            agent2 = Agent(
                task='Task in tab 2',
                llm=mock_llm2,
                browser_session=shared_session,
                enable_memory=False,
            )

            # Run in parallel
            results = await asyncio.gather(agent1.run(), agent2.run())

            # Verify success
            for result in results:
                _assert_finished_with_done(result)

            # Verify multiple tabs were created
            tabs = await shared_session.get_tabs()
            assert len(tabs) >= 2  # At least 2 tabs

            # Verify same browser session was used
            assert agent1.browser_session == agent2.browser_session
            assert agent1.browser_session == shared_session
        finally:
            # Give playwright tasks a moment to complete before killing
            await asyncio.sleep(0.1)
            await shared_session.kill()
            # Give playwright.stop() time to complete cleanup
            await asyncio.sleep(0.1)

    @pytest.mark.skip('TODO: fix this')
    async def test_reuse_browser_session_sequentially(self):
        """Test reusing a browser session sequentially with keep_alive"""
        logger.info('Testing sequential browser session reuse')

        # Create mock LLM
        mock_llm = create_mock_llm()

        # Create a session with keep_alive
        session = BrowserSession(
            browser_profile=BrowserProfile(
                headless=True,
                user_data_dir=None,
                keep_alive=True,
            )
        )

        try:
            await session.start()

            # Get browser PID from private local_browser_watchdog
            initial_browser_pid = (
                session._local_browser_watchdog._subprocess.pid
                if session._local_browser_watchdog and session._local_browser_watchdog._subprocess
                else None
            )

            # First agent
            agent1 = Agent(
                task='First task',
                llm=mock_llm,
                browser_session=session,
                enable_memory=False,
            )
            result1 = await agent1.run()

            # Session should still be alive
            current_browser_pid = (
                session._local_browser_watchdog._subprocess.pid
                if session._local_browser_watchdog and session._local_browser_watchdog._subprocess
                else None
            )
            assert current_browser_pid is not None
            assert current_browser_pid == initial_browser_pid

            # Second agent reusing session
            agent2 = Agent(
                task='Second task',
                llm=mock_llm,
                browser_session=session,
                enable_memory=False,
            )
            result2 = await agent2.run()

            # Verify success and same browser
            for result in [result1, result2]:
                _assert_finished_with_done(result)

            # Verify same browser process is still running
            final_browser_pid = (
                session._local_browser_watchdog._subprocess.pid
                if session._local_browser_watchdog and session._local_browser_watchdog._subprocess
                else None
            )
            assert final_browser_pid == initial_browser_pid
        finally:
            await session.kill()


if __name__ == '__main__':
    asyncio.run(TestParallelism().test_one_event_loop_with_asyncio_run_and_one_task())

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/dsouza-anush/browser-use-heroku'

If you have feedback or need assistance with the MCP directory API, please join our Discord server.

test_agent_multiprocessing.py•14.3 KiB