{"id":"https://openalex.org/W7162145642","doi":"https://doi.org/10.48550/arxiv.2605.22100","title":"MPDocBench-Parse: Benchmarking Practical Multi-page Document Parsing","display_name":"MPDocBench-Parse: Benchmarking Practical Multi-page Document Parsing","publication_year":2026,"publication_date":"2026-05-21","ids":{"openalex":"https://openalex.org/W7162145642","doi":"https://doi.org/10.48550/arxiv.2605.22100"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.22100","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.22100","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.22100","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5044029978","display_name":"Bangbang Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Bangbang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039720488","display_name":"Hangdi Xing","orcid":"https://orcid.org/0000-0002-1770-005X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xing, Hangdi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136768444","display_name":"Yifan Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yifan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136756672","display_name":"Jianjun Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Jianjun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136738308","display_name":"Qi Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Qi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038757890","display_name":"Feiyu Gao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gao, Feiyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136785407","display_name":"Zhibo Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Zhibo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136745928","display_name":"Shuai Bai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bai, Shuai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136751119","display_name":"Ming Yan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yan, Ming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136811954","display_name":"Jieping Ye","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ye, Jieping","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136736474","display_name":"Hongtao Xie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xie, Hongtao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":11,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.7928000092506409,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.7928000092506409,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.05209999904036522,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.04520000144839287,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.7657999992370605},{"id":"https://openalex.org/keywords/hierarchy","display_name":"Hierarchy","score":0.5329999923706055},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.4828000068664551},{"id":"https://openalex.org/keywords/document-structure-description","display_name":"Document Structure Description","score":0.4729999899864197},{"id":"https://openalex.org/keywords/well-formed-document","display_name":"Well-formed document","score":0.46320000290870667},{"id":"https://openalex.org/keywords/table","display_name":"Table (database)","score":0.45010000467300415},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4352000057697296},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.39480000734329224},{"id":"https://openalex.org/keywords/document-processing","display_name":"Document processing","score":0.34119999408721924},{"id":"https://openalex.org/keywords/knowledge-base","display_name":"Knowledge base","score":0.33820000290870667}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8518000245094299},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.7657999992370605},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5849000215530396},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5509999990463257},{"id":"https://openalex.org/C31170391","wikidata":"https://www.wikidata.org/wiki/Q188619","display_name":"Hierarchy","level":2,"score":0.5329999923706055},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.505299985408783},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.4828000068664551},{"id":"https://openalex.org/C68699486","wikidata":"https://www.wikidata.org/wiki/Q265904","display_name":"Document Structure Description","level":3,"score":0.4729999899864197},{"id":"https://openalex.org/C137441365","wikidata":"https://www.wikidata.org/wiki/Q7981054","display_name":"Well-formed document","level":5,"score":0.46320000290870667},{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.45010000467300415},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4352000057697296},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.39480000734329224},{"id":"https://openalex.org/C67905146","wikidata":"https://www.wikidata.org/wiki/Q5287646","display_name":"Document processing","level":2,"score":0.34119999408721924},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.33820000290870667},{"id":"https://openalex.org/C60690694","wikidata":"https://www.wikidata.org/wiki/Q894902","display_name":"Bottom-up parsing","level":4,"score":0.3158999979496002},{"id":"https://openalex.org/C46503548","wikidata":"https://www.wikidata.org/wiki/Q1145976","display_name":"Plain text","level":3,"score":0.31130000948905945},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.3082999885082245},{"id":"https://openalex.org/C68476402","wikidata":"https://www.wikidata.org/wiki/Q1456936","display_name":"Table of contents","level":2,"score":0.3001999855041504},{"id":"https://openalex.org/C144986985","wikidata":"https://www.wikidata.org/wiki/Q871236","display_name":"Hierarchical database model","level":2,"score":0.2971999943256378},{"id":"https://openalex.org/C161156560","wikidata":"https://www.wikidata.org/wiki/Q1638872","display_name":"Document retrieval","level":2,"score":0.2930999994277954},{"id":"https://openalex.org/C2778790839","wikidata":"https://www.wikidata.org/wiki/Q6667497","display_name":"Logical form","level":2,"score":0.2928999960422516},{"id":"https://openalex.org/C72773152","wikidata":"https://www.wikidata.org/wiki/Q5287629","display_name":"Document layout analysis","level":3,"score":0.29010000824928284},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.28870001435279846},{"id":"https://openalex.org/C105888452","wikidata":"https://www.wikidata.org/wiki/Q7565148","display_name":"Source document","level":2,"score":0.2867000102996826},{"id":"https://openalex.org/C56666940","wikidata":"https://www.wikidata.org/wiki/Q788790","display_name":"Documentation","level":2,"score":0.2849000096321106},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.2840000092983246},{"id":"https://openalex.org/C67277372","wikidata":"https://www.wikidata.org/wiki/Q7449085","display_name":"Semantic role labeling","level":3,"score":0.27950000762939453},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.2702000141143799},{"id":"https://openalex.org/C60048249","wikidata":"https://www.wikidata.org/wiki/Q37437","display_name":"Syntax","level":2,"score":0.26589998602867126},{"id":"https://openalex.org/C2986991398","wikidata":"https://www.wikidata.org/wiki/Q37437","display_name":"Syntactic structure","level":3,"score":0.25760000944137573},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.2556999921798706},{"id":"https://openalex.org/C53893814","wikidata":"https://www.wikidata.org/wiki/Q7378909","display_name":"Rule-based machine translation","level":2,"score":0.2538999915122986},{"id":"https://openalex.org/C22367795","wikidata":"https://www.wikidata.org/wiki/Q7625208","display_name":"Structured prediction","level":2,"score":0.25360000133514404}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.22100","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.22100","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.22100","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.22100","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.7594968676567078,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Document":[0],"parsing":[1,79,176],"converts":[2],"visually":[3],"rich":[4],"documents":[5,88],"into":[6],"machine-readable":[7],"structured":[8],"representations,":[9],"forming":[10],"a":[11,74,112,170],"crucial":[12],"foundation":[13,172],"for":[14,23,29,48,76,115,173],"information":[15],"systems.":[16],"Although":[17],"many":[18],"benchmarks":[19,33],"have":[20],"been":[21],"proposed":[22],"document":[24,78,94,175],"parsing,":[25,163],"they":[26,53,152],"remain":[27],"inadequate":[28],"realistic":[30,179],"scenarios.":[31,180],"Existing":[32],"either":[34],"focus":[35],"on":[36,148],"specific":[37],"tasks":[38],"or":[39],"assess":[40],"only":[41],"single-page,":[42],"text-centric":[43],"settings,":[44],"making":[45],"them":[46],"insufficient":[47],"practical":[49],"multi-page":[50,77],"parsing.":[51],"Moreover,":[52],"lack":[54],"fine-grained":[55],"evaluation":[56],"of":[57],"semantic":[58,158],"continuity,":[59],"hierarchical":[60,165],"structure":[61,166],"recovery,":[62],"and":[63,98,104,118,124,129,136,164],"visual":[64,161],"content":[65,116,162],"preservation.":[66],"To":[67],"address":[68],"these":[69],"gaps,":[70],"we":[71],"propose":[72],"MPDocBench-Parse,":[73],"benchmark":[75],"in":[80,96,157],"real-world":[81],"applications.":[82],"It":[83],"contains":[84],"433":[85],"manually":[86],"annotated":[87],"with":[89,100],"3,246":[90],"pages,":[91],"covering":[92,121],"15":[93],"types":[95],"English":[97],"Chinese,":[99],"diverse":[101],"layout":[102],"styles,":[103],"supports":[105],"document-level":[106],"end-to-end":[107],"evaluation.":[108],"We":[109],"further":[110],"design":[111],"comprehensive":[113],"protocol":[114],"fidelity":[117],"logical":[119],"structure,":[120],"text,":[122],"table,":[123],"formula":[125],"recognition,":[126],"truncated":[127],"text":[128,150],"table":[130],"merging,":[131],"figure":[132],"extraction,":[133,151],"reading":[134],"order,":[135],"heading":[137],"hierarchy":[138],"recovery.":[139,167],"Experiments":[140],"show":[141],"that,":[142],"while":[143],"existing":[144],"models":[145],"perform":[146],"well":[147],"basic":[149],"still":[153],"suffer":[154],"clear":[155],"limitations":[156],"continuity":[159],"integration,":[160],"MPDocBench-Parse":[168],"provides":[169],"unified":[171],"advancing":[174],"toward":[177],"more":[178]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-23T00:00:00"}
