# document_parsing_quality_ocr.py (984 B)
from dingo.config import InputArgs
from dingo.exec import Executor
if __name__ == "__main__":
    # Example entry point: assemble an evaluation config for a local JSONL
    # file, hand it to the "local" executor, and print whatever it returns.

    # Maps the config's field names to column names in the JSONL records.
    # NOTE(review): presumably "pred_content" holds the OCR prediction and
    # "gt_markdown" the ground truth -- confirm against the test data file.
    field_mapping = {
        "id": "id",
        "content": "pred_content",
        "prompt": "gt_markdown",
    }

    dataset_section = {
        "source": "local",
        "format": "jsonl",
        "field": field_mapping,
    }

    # Both "bad" and "good" are switched on under "result_save".
    executor_section = {
        "prompt_list": ["PromptMinerURecognizeQuality"],
        "result_save": {"bad": True, "good": True},
    }

    # NOTE(review): "key" and "api_url" are empty strings here; presumably
    # they must be filled in with real credentials before running -- confirm.
    llm_settings = {
        "LLMMinerURecognizeQuality": {
            "key": "",
            "api_url": "",
        }
    }
    evaluator_section = {"llm_config": llm_settings}

    # NOTE(review): the input path is relative, so it presumably depends on
    # the directory the script is launched from -- verify.
    config = {
        "input_path": "../../test/data/test_document_OCR_recognize.jsonl",
        "dataset": dataset_section,
        "executor": executor_section,
        "evaluator": evaluator_section,
    }

    args = InputArgs(**config)

    # Look up the executor registered under "local" and instantiate it.
    local_executor_cls = Executor.exec_map["local"]
    runner = local_executor_cls(args)

    summary = runner.execute()
    print(summary)