{"id":"https://openalex.org/W7140527763","doi":"https://doi.org/10.48550/arxiv.2603.23511","title":"DISCO: Document Intelligence Suite for COmparative Evaluation","display_name":"DISCO: Document Intelligence Suite for COmparative Evaluation","publication_year":2026,"publication_date":"2026-03-04","ids":{"openalex":"https://openalex.org/W7140527763","doi":"https://doi.org/10.48550/arxiv.2603.23511"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.23511","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.23511","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.23511","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114601845","display_name":"Kenza Benkirane","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Benkirane, Kenza","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064040711","display_name":"Dan Goldwater","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Goldwater, Dan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004304345","display_name":"Martin Asenov","orcid":"https://orcid.org/0000-0003-4610-3112"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Asenov, Martin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5083561499","display_name":"Aneiss Ghodsi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ghodsi, Aneiss","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9620000123977661,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9620000123977661,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.012900000438094139,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.010300000198185444,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/suite","display_name":"Suite","score":0.733299970626831},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.617900013923645},{"id":"https://openalex.org/keywords/document-processing","display_name":"Document processing","score":0.5582000017166138},{"id":"https://openalex.org/keywords/document-retrieval","display_name":"Document retrieval","score":0.4948999881744385},{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.45570001006126404},{"id":"https://openalex.org/keywords/handwriting","display_name":"Handwriting","score":0.4408999979496002},{"id":"https://openalex.org/keywords/optical-character-recognition","display_name":"Optical character recognition","score":0.41620001196861267},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.4153999984264374}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8095999956130981},{"id":"https://openalex.org/C79581498","wikidata":"https://www.wikidata.org/wiki/Q1367530","display_name":"Suite","level":2,"score":0.733299970626831},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.617900013923645},{"id":"https://openalex.org/C67905146","wikidata":"https://www.wikidata.org/wiki/Q5287646","display_name":"Document processing","level":2,"score":0.5582000017166138},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5374000072479248},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5174000263214111},{"id":"https://openalex.org/C161156560","wikidata":"https://www.wikidata.org/wiki/Q1638872","display_name":"Document retrieval","level":2,"score":0.4948999881744385},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.47440001368522644},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.45570001006126404},{"id":"https://openalex.org/C2779386606","wikidata":"https://www.wikidata.org/wiki/Q2393642","display_name":"Handwriting","level":2,"score":0.4408999979496002},{"id":"https://openalex.org/C546480517","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Optical character recognition","level":3,"score":0.41620001196861267},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.4153999984264374},{"id":"https://openalex.org/C2779500292","wikidata":"https://www.wikidata.org/wiki/Q14802672","display_name":"Text processing","level":2,"score":0.3684000074863434},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3621000051498413},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.2985000014305115},{"id":"https://openalex.org/C177937566","wikidata":"https://www.wikidata.org/wiki/Q4223102","display_name":"Document clustering","level":3,"score":0.2969000041484833},{"id":"https://openalex.org/C28076734","wikidata":"https://www.wikidata.org/wiki/Q63087","display_name":"Coreference","level":3,"score":0.290800005197525},{"id":"https://openalex.org/C164614171","wikidata":"https://www.wikidata.org/wiki/Q5204775","display_name":"DECIPHER","level":2,"score":0.28360000252723694},{"id":"https://openalex.org/C175309249","wikidata":"https://www.wikidata.org/wiki/Q725864","display_name":"Pipeline transport","level":2,"score":0.2831999957561493},{"id":"https://openalex.org/C2983812711","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Text recognition","level":3,"score":0.2800999879837036},{"id":"https://openalex.org/C2777737414","wikidata":"https://www.wikidata.org/wiki/Q4868296","display_name":"Font","level":2,"score":0.2671999931335449},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.25220000743865967}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.23511","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.23511","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.23511","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.23511","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.5188370943069458}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Document":[0],"intelligence":[1],"requires":[2],"accurate":[3],"text":[4,89,100],"extraction":[5],"and":[6,29,36,51,63,81,101,135],"reliable":[7,78],"reasoning":[8,136],"over":[9],"document":[10,41,64,114,128,133],"content.":[11],"We":[12],"introduce":[13],"\\textbf{DISCO},":[14],"a":[15],"\\emph{Document":[16],"Intelligence":[17],"Suite":[18],"for":[19,69,79,82,126],"COmparative":[20],"Evaluation},":[21],"that":[22,57],"evaluates":[23],"optical":[24],"character":[25],"recognition":[26],"(OCR)":[27],"pipelines":[28,74],"vision-language":[30],"models":[31],"(VLMs)":[32],"separately":[33],"on":[34,98,112,119,132],"parsing":[35],"question":[37],"answering":[38],"across":[39,61],"diverse":[40],"types,":[42],"including":[43],"handwritten":[44],"text,":[45],"multilingual":[46,99],"scripts,":[47],"medical":[48],"forms,":[49],"infographics,":[50],"multi-page":[52,85],"documents.":[53],"Our":[54],"evaluation":[55],"shows":[56],"performance":[58,111],"varies":[59],"substantially":[60],"tasks":[62],"characteristics,":[65],"underscoring":[66],"the":[67],"need":[68],"complexity-aware":[70],"approach":[71],"selection.":[72],"OCR":[73],"are":[75],"generally":[76],"more":[77],"handwriting":[80],"long":[83],"or":[84],"documents,":[86],"where":[87],"explicit":[88],"grounding":[90],"supports":[91],"text-heavy":[92],"reasoning,":[93],"while":[94,116],"VLMs":[95],"perform":[96],"better":[97],"visually":[102],"rich":[103],"layouts.":[104],"Task-aware":[105],"prompting":[106],"yields":[107],"mixed":[108],"effects,":[109],"improving":[110],"some":[113],"types":[115],"degrading":[117],"it":[118],"others.":[120],"These":[121],"findings":[122],"provide":[123],"empirical":[124],"guidance":[125],"selecting":[127],"processing":[129],"strategies":[130],"based":[131],"structure":[134],"demands.":[137]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-27T00:00:00"}
