Skip to main content
Glama

baidu-ai-search

Official
by baidubce
test_v2_general_ocr.py5.26 kB
# Copyright (c) 2024 Baidu, Inc. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. import os import requests import base64 import unittest import appbuilder from appbuilder.core.components.v2 import GeneralOCR from appbuilder.core.component import ComponentOutput from appbuilder.core._exception import InvalidRequestArgumentError @unittest.skipUnless(os.getenv("TEST_CASE", "UNKNOWN") == "CPU_PARALLEL", "") class TestGeneralOCR(unittest.TestCase): def setUp(self) -> None: self.com = GeneralOCR() def test_run(self): img_url = "https://bj.bcebos.com/v1/appbuilder/general_ocr_test.png?" \ "authorization=bce-auth-v1%2FALTAKGa8m4qCUasgoljdEDAzLm%2F2024-01-" \ "11T10%3A59%3A17Z%2F-1%2Fhost%2F081bf7bcccbda5207c82a4de074628b04ae" \ "857a27513734d765495f89ffa5f73" raw_image = requests.get(img_url).content image_base64 = base64.b64encode(raw_image) message = appbuilder.Message(content={"image_base64": image_base64}) output = self.com.run(message) print(output) def test_tool_eval(self): img_url = "https://bj.bcebos.com/v1/appbuilder/general_ocr_test.png?" \ "authorization=bce-auth-v1%2FALTAKGa8m4qCUasgoljdEDAzLm%2F2024-01-" \ "11T10%3A59%3A17Z%2F-1%2Fhost%2F081bf7bcccbda5207c82a4de074628b04ae" \ "857a27513734d765495f89ffa5f73" img_names = ["general_ocr_test.png", "test"] img_urls = [ "https://agi-dev-platform-file.bj.bcebos.com/files_qa/10b495b5ceea44e5a1e7d194f3a59ed7/uploads/file-6cxezmhc_1.jpeg?authorization=bce-auth-v1%2FALTAKGa8m4qCUasgoljdEDAzLm%2F2025-08-04T03%3A27%3A03Z%2F259200%2Fhost%2Ff420874be9fe2511a73eab458339aad110d97c55742b14fb4fabf78cc0e1d4cc", "https://agi-dev-platform-file.bj.bcebos.com/files_qa/10b495b5ceea44e5a1e7d194f3a59ed7/uploads/file-wjka6g3h_%E5%BC%80%E6%88%B7%E8%AE%B8%E5%8F%AF%E8%AF%81.jpeg?authorization=bce-auth-v1%2FALTAKGa8m4qCUasgoljdEDAzLm%2F2025-08-04T03%3A28%3A23Z%2F259200%2Fhost%2F2e3355869d9f62143051a12c2b19bc39b33d439e18839fe6dd15d0f37ab3a999"] pdf_urls = ["https://agi-dev-platform-file.bj.bcebos.com/files_qa/10b495b5ceea44e5a1e7d194f3a59ed7/uploads/file-hf7nhtdw_8_%E8%B4%A8%E9%87%8F%E6%B5%81%E9%87%8F%E8%AE%A1-1.pdf?authorization=bce-auth-v1%2FALTAKGa8m4qCUasgoljdEDAzLm%2F2025-08-04T03%3A22%3A29Z%2F259200%2Fhost%2Fd1e301ba51cbe39fbbe10a334c5e4f75d71b40522916e25205e83404b6cea791"] result = self.com.tool_eval(img_names=img_names, img_urls=img_urls, pdf_urls=pdf_urls, _sys_file_urls={'general_ocr_test.png': img_url}) for res in result: assert isinstance(res, ComponentOutput) print(res.content) def test_error_tool_eval(self): result = self.com.tool_eval(img_url='', img_name='') with self.assertRaises(InvalidRequestArgumentError): list(result) result = self.com.tool_eval(img_url='', img_name='test.jpg') with self.assertRaises(InvalidRequestArgumentError): list(result) def test_run_pdf_base64(self): pdf_url = "https://bj.bcebos.com/agi-dev-platform-sdk-test/8、质量流量计.pdf" raw_pdf = requests.get(pdf_url).content pdf_base64 = base64.b64encode(raw_pdf) general_ocr = GeneralOCR() out = general_ocr.run(appbuilder.Message(content={"pdf_base64": pdf_base64, "pdf_file_num": "3"})) self.assertIsInstance(out, appbuilder.Message) def test_run_pdf_url(self): pdf_url = "https://bj.bcebos.com/agi-dev-platform-sdk-test/8、质量流量计.pdf" general_ocr = GeneralOCR() out = general_ocr.run(appbuilder.Message(content={"pdf_url": pdf_url, "pdf_file_num": "5"})) self.assertIsInstance(out, appbuilder.Message) def test_tool_eval_pdf_url(self): pdf_url = "https://bj.bcebos.com/agi-dev-platform-sdk-test/8、质量流量计.pdf" result = self.com.tool_eval(pdf_urls=[pdf_url]) for iter in result: self.assertIsInstance(iter, ComponentOutput) def test_tool_eval_none_input(self): result = self.com.tool_eval(pdf_name="test.pdf") with self.assertRaises(InvalidRequestArgumentError): list(result) def test_rotated_image(self): image_url = "https://bj.bcebos.com/agi-dev-platform-sdk-test/8、质量流量计-1_rotated_page-0001.jpg" out = self.com.run(appbuilder.Message(content={ "image_url": image_url, "detect_direction": "true", "multidirectional_recognize": "false"} )) self.assertIsInstance(out, appbuilder.Message) if __name__ == "__main__": unittest.main()

Latest Blog Posts

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/baidubce/app-builder'

If you have feedback or need assistance with the MCP directory API, please join our Discord server