# Fetch the raw document bytes from the storage backend.
# NOTE(review): `bucket`, `name` and `doc` are defined outside this fragment.
file_bin = STORAGE_IMPL.get(bucket, name)

# Layout-recognition setting from the parser config; "DeepDOC" when the key is absent.
do_layout = doc["parser_config"].get("layout_recognize", "DeepDOC")

# Page count of the PDF; normalise a None result to 0 so `pages` is always a number.
# NOTE(review): presumably None signals that the page count could not be
# determined - confirm against PdfParser.total_page_number.
pages = PdfParser.total_page_number(doc["name"], file_bin)
if pages is None:
    pages = 0

# Pages per task: the configured "task_page_size" when it is set and truthy,
# otherwise 12 - or 22 for documents handled by the "paper" parser.
page_size = doc["parser_config"].get("task_page_size") or 12
if doc["parser_id"] == "paper":
    page_size = doc["parser_config"].get("task_page_size") or 22