from pathlib import Path
from dingo.config import InputArgs
from dingo.exec import Executor
# Project root directory, derived from this script's own location:
# Path(__file__).parent is the folder holding this file, and the two further
# .parent hops climb two more levels above it.
# NOTE(review): assumes this script lives exactly two folders below the
# repository root — confirm if the file is ever moved.
PROJECT_ROOT = Path(__file__).parent.parent.parent
if __name__ == '__main__':
    # Sample input file, addressed relative to the project root.
    ocr_sample_path = PROJECT_ROOT / "test/data/test_document_OCR_recognize.jsonl"

    # Dataset section: a local JSONL source.
    dataset_section = {
        "source": "local",
        "format": "jsonl",
        # NOTE(review): presumably maps dingo's logical field names to the
        # keys found in each JSONL record — confirm against the data file.
        "field": {
            "id": "id",
            "content": "pred_content",
            "image": "pred_bbox_image",
        },
    }

    # Executor section: one prompt, with both "bad" and "good" results saved.
    executor_section = {
        "prompt_list": ["PromptMinerURecognizeTrainQuality"],
        "result_save": {
            "bad": True,
            "good": True,
        },
    }

    # Evaluator section: settings for the LLM entry named below.
    # "key" and "api_url" are intentionally blank in this example;
    # presumably they must be filled in before a real run — confirm.
    evaluator_section = {
        "llm_config": {
            "LLMMinerURecognizeQuality": {
                "model": "gemini-2.5-pro",
                "key": "",
                "api_url": "",
            },
        },
    }

    # Assemble the full configuration in the same key order as before.
    run_config = {
        "input_path": str(ocr_sample_path),
        "dataset": dataset_section,
        "executor": executor_section,
        "evaluator": evaluator_section,
    }

    # Build the arguments object, pick the executor registered under
    # "local", run it, and print whatever execute() returns.
    parsed_args = InputArgs(**run_config)
    local_runner = Executor.exec_map["local"](parsed_args)
    outcome = local_runner.execute()
    print(outcome)