baidu-ai-search

Official

Overview Schema Related Servers Score Discussions

component_check.py•19.6 KiB

import json import os import inspect from jsonschema import validate from pydantic import BaseModel from appbuilder.utils.func_utils import Singleton from appbuilder.tests.component_schemas import type_to_json_schemas from appbuilder.utils.json_schema_to_model import json_schema_to_pydantic_model class CheckInfo(BaseModel): check_rule_name: str check_result: bool check_detail: str class RuleBase(object): def __init__(self): self.invalid = False def check(self, component_cls) -> CheckInfo: raise NotImplementedError def reset_state(self): self.invalid = False class ComponentCheckBase(metaclass=Singleton): def __init__(self): self.rules = {} def register_rule(self, rule_name: str, rule_obj: RuleBase): if not isinstance(rule_obj, RuleBase): raise TypeError("rule_obj must be a subclass of RuleBase") if rule_name in self.rules: raise ValueError(f"Rule {rule_name} already exists.") self.rules[rule_name] = rule_obj def remove_rule(self, rule_name: str): del self.rules[rule_name] def notify(self, component_obj, component_case) -> tuple[bool, list]: check_pass = True check_details = {} reasons = [] for rule_name, rule_obj in self.rules.items(): if rule_name == "ToolEvalOutputJsonRule": res = rule_obj.check(component_obj, component_case) else: res = rule_obj.check(component_obj) check_details[rule_name] = res if res.check_result == False: check_pass = False reasons.append(res.check_detail) if check_pass: return True, reasons else: return False, reasons class ManifestValidRule(RuleBase): """ 通过尝试将component的manifest转换为pydantic模型来检查manifest是否符合规范 """ def __init__(self, **kwargs): super().__init__() self.rule_name = "ManifestValidRule" def check(self, component_obj) -> CheckInfo: check_pass_flag = True invalid_details = [] try: if not hasattr(component_obj, "manifests"): raise ValueError("No manifests found") manifests = component_obj.manifests # NOTE(暂时检查manifest中的第一个mainfest) if not manifests or len(manifests) == 0: raise ValueError("No manifests found") manifest = manifests[0] tool_name = manifest['name'] tool_desc = manifest['description'] schema = manifest["parameters"] schema["title"] = tool_name # 第一步，将json schema转换为pydantic模型 pydantic_model = json_schema_to_pydantic_model(schema, tool_name) check_to_json = pydantic_model.schema_json() json_to_dict = json.loads(check_to_json) if "properties" in schema: properties = schema["properties"] for key, value in properties.items(): if "type" not in value: invalid_details.append("\'type' must be in properties item: {}".format(key)) if "description" not in value: invalid_details.append("\'description' must be in properties item: {}".format(key)) except Exception as e: print(e) check_pass_flag = False invalid_details.append(str(e)) if len(invalid_details) > 0: check_pass_flag = False invalid_details = ",".join(invalid_details) else: check_pass_flag = True invalid_details = "" return CheckInfo( check_rule_name=self.rule_name, check_result=check_pass_flag, check_detail=invalid_details) Data_Type = { 'string': str, 'integer': int, 'object': int, 'array': list, 'boolean': bool, 'null': None, } class InitKwargsRule(RuleBase): def __init__(self): super().__init__() self.rule_name = "InitKwargsRule" def _accepts_kwargs(self, func): """ 检查函数是否接受 **kwargs 参数。 """ sig = inspect.signature(func) params = sig.parameters return any(p.kind == inspect.Parameter.VAR_KEYWORD for p in params.values()) def check(self, component_obj) -> CheckInfo: if not self._accepts_kwargs(component_obj.__init__): return CheckInfo( check_rule_name=self.rule_name, check_result=False, check_detail="组件的__init__初始化方法需要添加**kwargs参数" ) else: return CheckInfo( check_rule_name=self.rule_name, check_result=True, check_detail="" ) class ToolEvalKwargsRule(RuleBase): def __init__(self): super().__init__() self.rule_name = "ToolEvalKwargsRule" def _accepts_kwargs(self, func): """ 检查函数是否接受 **kwargs 参数。 """ sig = inspect.signature(func) params = sig.parameters return any(p.kind == inspect.Parameter.VAR_KEYWORD for p in params.values()) def check(self, component_obj) -> CheckInfo: if not self._accepts_kwargs(component_obj.tool_eval): return CheckInfo( check_rule_name=self.rule_name, check_result=False, check_detail="组件的__init__初始化方法需要添加**kwargs参数" ) else: return CheckInfo( check_rule_name=self.rule_name, check_result=True, check_detail="" ) class MainfestMatchToolEvalRule(RuleBase): def __init__(self): super().__init__() self.rule_name = "MainfestMatchToolEvalRule" def check(self, component_obj) -> CheckInfo: check_pass_flag = True invalid_details = [] try: if not hasattr(component_obj, "manifests"): raise ValueError("No manifests found") manifests = component_obj.manifests # NOTE(暂时检查manifest中的第一个mainfest) if not manifests or len(manifests) == 0: raise ValueError("No manifests found") manifest = manifests[0] if 'parameters' in manifest and 'properties' in manifest['parameters']: properties = manifest['parameters']['properties'] manifest_var = properties.keys() else: manifest_var = [] # 交互检查 tool_eval_input_params = [] print("required_params: {}".format(manifest_var)) signature = inspect.signature(component_obj.tool_eval) ileagal_params = [] for param_name, param in signature.parameters.items(): if param_name == 'kwargs' or param_name == 'args' or param_name == 'self': continue tool_eval_input_params.append(param_name) if param_name not in manifest_var: check_pass_flag = False ileagal_params.append(param_name) if len(ileagal_params) > 0: invalid_details.append("tool_eval 参数 {} 不在 mainfest 参数列表中".format(",".join(ileagal_params))) ileagal_params =[] for required_param in manifest_var: if required_param not in tool_eval_input_params: check_pass_flag = False ileagal_params.append(required_param) if len(ileagal_params) > 0: invalid_details.append("mainfest 参数 {} 不在 tool_eval 参数列表中".format(",".join(ileagal_params))) return CheckInfo( check_rule_name=self.rule_name, check_result=check_pass_flag, check_detail=",".join(invalid_details)) except Exception as e: check_pass_flag = False invalid_details.append(str(e)) return CheckInfo( check_rule_name=self.rule_name, check_result=check_pass_flag, check_detail=",".join(invalid_details)) class ToolEvalInputNameRule(RuleBase): """ 检查tool_eval的输入参数中，是否包含系统保留的输入名称 """ def __init__(self): super().__init__() self.rule_name = 'ToolEvalInputNameRule' self.system_input_name = [ "_sys_name", "_sys_origin_query", "_sys_user_instruction", "_sys_file_names", "_sys_file_urls", "_sys_current_time", "_sys_chat_history", "_sys_used_tool", "_sys_uid", "_sys_traceid", "_sys_conversation_id", "_sys_gateway_endpoint", "_sys_appbuiler_token", "_sys_debug", "_sys_custom_variables", "_sys_thought_model_config", "_sys_rag_model_config", "_sys_parent_span_id", "_sys_span_id", "_sys_memory", "_sys_code_execution_endpoint", "_sys_session_id" ] def check(self, component_obj) -> CheckInfo: tool_eval_signature = inspect.signature(component_obj.tool_eval) params = tool_eval_signature.parameters invalid_details = [] check_pass_flag = True for param_name in params: if param_name == 'self': continue if param_name in self.system_input_name: invalid_details.append(param_name) check_pass_flag = False return CheckInfo( check_rule_name=self.rule_name, check_result=check_pass_flag, check_detail="以下ToolEval方法参数名称是系统保留字段，请更换：{}".format("，".join(invalid_details)) if len(invalid_details) > 0 else "") class ToolEvalOutputJsonRule(RuleBase): """ 检查tool_eval的输出结果是否符合对应的json schema """ def __init__(self, **kwargs): super().__init__() self.rule_name = 'ToolEvalOutputJsonRule' def _check_pre_format(self, outputs): invalid_details = [] if "content" not in outputs: invalid_details.append("ToolEval返回值不符合规范：返回内容缺少content") return invalid_details for content in outputs["content"]: if "type" not in content: invalid_details.append("ToolEval返回值不符合规范：返回content缺少type") break out_type = content["type"] if out_type not in type_to_json_schemas: invalid_details.append("ToolEval返回值不符合JSON Schema：返回content.type={} 不是合法的输出类型".format(out_type)) break return invalid_details def _check_jsonschema(self, outputs, output_schemas): """检查输出格式是否符合对应的json schema """ invalid_details = [] if len(self._check_pre_format(outputs)) > 0 : return invalid_details for content in outputs["content"]: out_type = content["type"] out_schema = type_to_json_schemas[out_type] if out_schema not in output_schemas: invalid_details.append("ToolEval返回值不符合JSON Schema：{} 不是该组件期望的Json Schema输出类型".format(out_schema['$schema'])) continue try: validate(instance=content, schema=out_schema) except Exception as e: invalid_details.append("ToolEval返回值不符合JSON Schema: {}\n".format(e.message)) return invalid_details def _gather_iter_outputs(self, outputs): text_output = "" oral_text_output = "" code_output = "" for content in outputs.content: out_type = content.type if out_type == "text": text_output += content.text.info elif out_type == "oral_text": oral_text_output += content.text.info elif out_type == "code": code_output += content.text.code return { "text": text_output, "oral_text": oral_text_output, "code": code_output, } def _check_text_and_code(self, component_case, output_dict): """检查输出的内容是否符合预期，只检查text(包含oral_text)和code """ if not hasattr(component_case,"outputs"): return [] expected_output = component_case.outputs() expected_output_texts = [] expected_output_oral_texts = [] expected_output_codes = [] if "text" in expected_output: expected_output_texts = expected_output["text"] if "oral_text" in expected_output: expected_output_oral_texts = expected_output["oral_text"] if "code" in expected_output: expected_output_codes = expected_output["code"] lost_texts = [] lost_oral_texts = [] lost_code = [] for expected_output_text in expected_output_texts: if expected_output_text not in output_dict["text"]: lost_texts.append(expected_output_text) for expected_output_oral_text in expected_output_oral_texts: if expected_output_oral_text not in output_dict["oral_text"]: lost_oral_texts.append(expected_output_oral_text) for expected_output_code in expected_output_codes: if expected_output_code not in output_dict["code"]: lost_code.append(expected_output_code) error_message = "" if len(lost_texts) > 0: error_message += "应包含text:{}".format(", ".join(lost_texts)) if len(lost_oral_texts) > 0: error_message += "应包含oral_text:{}".format(", ".join(lost_oral_texts)) if len(lost_code) > 0: error_message += "应包含code:{}".format(", ".join(lost_code)) if error_message != "": return ["ToolEval返回内容与预期不符: " + error_message] else: return [] def check(self, component_obj, component_case) -> CheckInfo: invalid_details = [] input_dict = component_case.inputs() output_json_schemas = component_case.schemas() try: stream_output_dict = {"text": "", "oral_text":"", "code": ""} stream_outputs = component_obj.tool_eval(**input_dict) for stream_output in stream_outputs: iter_invalid_detail = self._check_jsonschema(stream_output.model_dump(), output_json_schemas) invalid_details.extend(iter_invalid_detail) iter_output_dict = self._gather_iter_outputs(stream_output) stream_output_dict["text"] += iter_output_dict["text"] stream_output_dict["oral_text"] += iter_output_dict["oral_text"] stream_output_dict["code"] += iter_output_dict["code"] if len(invalid_details) == 0: invalid_details.extend(self._check_text_and_code(component_case, stream_output_dict)) except Exception as e: invalid_details.append("ToolEval执行失败: {}".format(e)) if len(invalid_details) > 0: return CheckInfo( check_rule_name=self.rule_name, check_result=False, check_detail=",".join(invalid_details)) else: return CheckInfo( check_rule_name=self.rule_name, check_result=True, check_detail="") def register_component_check_rule(rule_name: str, rule_cls: RuleBase): component_checker = ComponentCheckBase() component_checker.register_rule(rule_name, rule_cls()) def check_component_with_retry(component_import_res_tuple): """ 使用重试机制检查组件。测试用例失败后会重试两次。 Args: component_import_res_tuple (tuple): 包含组件和导入结果的元组。 Returns: list: 包含错误信息的数据列表。 """ component, import_res, component_case_cls = component_import_res_tuple component_check_base = ComponentCheckBase() if inspect.isclass(component): component_name = component.__name__ else: component_name = component error_data = [] max_retries = 2 # 设置最大重试次数 attempts = 0 while attempts <= max_retries: if import_res["import_error"] != "": error_data.append({"Component Name": component_name, "Error Message": import_res["import_error"]}) print("组件名称:{} 错误信息:{}".format(component_name, import_res["import_error"])) break component_case = component_case_cls() envs = component_case.envs() os.environ.update(envs) component_cls = import_res["obj"] component_obj = component_cls(**component_case.init_args()) try: # 此处的self.component_check_base.notify需要根据实际情况修改 pass_check, reasons = component_check_base.notify(component_obj, component_case) # 示例修改 reasons = list(set(reasons)) if not pass_check: error_data.append({"Component Name": component_name, "Error Message": ", ".join(reasons)}) print("组件名称:{} 错误信息:{}".format(component_name, ", ".join(reasons))) # 如果检查失败，增加尝试次数并重试 attempts += 1 if attempts <= max_retries: print("组件名称:{} 将重试，当前尝试次数:{}".format(component_name, attempts)) continue # 如果检查通过，则退出循环 break except Exception as e: error_data.append({"Component Name": component_name, "Error Message": str(e)}) print("组件名称:{} 错误信息:{}".format(component_name, str(e))) # 如果发生异常，增加尝试次数并重试 attempts += 1 if attempts <= max_retries: print("组件名称:{} 将重试，当前尝试次数:{}".format(component_name, attempts)) continue finally: for env in envs: os.environ.pop(env) return error_data def write_error_data(txt_file_path, error_df, error_stats): """将组件错误信息写入文件 Args: error_df (Union[pd.DataFrame, None]): 错误信息表格 error_stats (dict): 错误统计信息 """ with open(txt_file_path, 'w') as file: file.write("Component Name\tError Message\n") for _, row in error_df.iterrows(): file.write(f"{row['Component Name']}\t{row['Error Message']}\n") file.write("\n错误统计信息:\n") for error, count in error_stats.items(): file.write(f"错误信息: {error}, 出现次数: {count}\n") print(f"\n错误信息已写入: {txt_file_path}") register_component_check_rule("ManifestValidRule", ManifestValidRule) register_component_check_rule("MainfestMatchToolEvalRule", MainfestMatchToolEvalRule) register_component_check_rule("ToolEvalInputNameRule", ToolEvalInputNameRule) register_component_check_rule("ToolEvalOutputJsonRule", ToolEvalOutputJsonRule) register_component_check_rule("InitKwargsRule", InitKwargsRule) register_component_check_rule("ToolEvalKwargsRule", ToolEvalKwargsRule)

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/baidubce/app-builder'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

component_check.py•19.6 KiB