{"id":"https://openalex.org/W4399115094","doi":"https://doi.org/10.48550/arxiv.2405.17336","title":"XFormParser: A Simple and Effective Multimodal Multilingual Semi-structured Form Parser","display_name":"XFormParser: A Simple and Effective Multimodal Multilingual Semi-structured Form Parser","publication_year":2024,"publication_date":"2024-05-27","ids":{"openalex":"https://openalex.org/W4399115094","doi":"https://doi.org/10.48550/arxiv.2405.17336"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2405.17336","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2405.17336","pdf_url":"https://arxiv.org/pdf/2405.17336","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2405.17336","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101487855","display_name":"Xianfu Cheng","orcid":"https://orcid.org/0000-0002-4524-7555"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Cheng, Xianfu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100438478","display_name":"Hang Zhang","orcid":"https://orcid.org/0000-0003-2514-0811"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Hang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100726984","display_name":"Jian Yang","orcid":"https://orcid.org/0000-0003-4800-832X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Jian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102665179","display_name":"Xiang Li","orcid":"https://orcid.org/0000-0001-5026-2349"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Xiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101256953","display_name":"Weixiao Zhou","orcid":"https://orcid.org/0009-0006-8929-0834"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Weixiao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029039334","display_name":"Kui Wu","orcid":"https://orcid.org/0000-0002-6857-7231"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Fei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016661432","display_name":"Peiji Liu","orcid":"https://orcid.org/0000-0002-5130-6670"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Kui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107945522","display_name":"Wei Zhang","orcid":"https://orcid.org/0009-0001-4419-4551"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guan, Xiangyuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013878664","display_name":"Tao Sun","orcid":"https://orcid.org/0000-0001-8828-1174"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Tao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016178437","display_name":"Tongliang Li","orcid":"https://orcid.org/0000-0002-2488-2787"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Xianjie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036786337","display_name":"Zhoujun Li","orcid":"https://orcid.org/0000-0002-9603-9713"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Tongliang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Li, Zhoujun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Zhoujun","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":12,"corresponding_author_ids":["https://openalex.org/A5101487855"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9912999868392944,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9912999868392944,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9610000252723694,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9577999711036682,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.8120567798614502},{"id":"https://openalex.org/keywords/simple","display_name":"Simple (philosophy)","score":0.8060895204544067},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.718890905380249},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.47298797965049744},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.35972076654434204},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.055278271436691284}],"concepts":[{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.8120567798614502},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.8060895204544067},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.718890905380249},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.47298797965049744},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35972076654434204},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.055278271436691284},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2405.17336","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2405.17336","pdf_url":"https://arxiv.org/pdf/2405.17336","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2405.17336","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2405.17336","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2405.17336","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2405.17336","pdf_url":"https://arxiv.org/pdf/2405.17336","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4399115094.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W1585007175","https://openalex.org/W2382521049","https://openalex.org/W2390279801","https://openalex.org/W6643695","https://openalex.org/W4381248170","https://openalex.org/W3189621521","https://openalex.org/W2173794830","https://openalex.org/W3204019825"],"abstract_inverted_index":{"In":[0,72],"the":[1,115,137],"domain":[2],"of":[3,20,117,140],"Document":[4,26],"AI,":[5],"parsing":[6,47,59,119,138],"semi-structured":[7,84],"image":[8],"form":[9,34,46],"is":[10,48,120],"a":[11,77,91,109,127],"crucial":[12],"Key":[13],"Information":[14],"Extraction":[15],"(KIE)":[16],"task.":[17],"The":[18,193],"advent":[19],"pre-trained":[21,94,197],"multimodal":[22],"models":[23,198],"significantly":[24,121],"empowers":[25],"AI":[27],"frameworks":[28],"to":[29,161,170],"extract":[30],"key":[31],"information":[32],"from":[33],"documents":[35],"in":[36,57,63,66,142,178,188],"different":[37],"formats":[38],"such":[39],"as":[40],"PDF,":[41],"Word,":[42],"and":[43,60,69,82,97,104,152,190,196],"images.":[44],"Nonetheless,":[45],"still":[49],"encumbered":[50],"by":[51],"notable":[52],"challenges":[53],"like":[54],"subpar":[55],"capabilities":[56],"multilingual":[58,118,189],"diminished":[61],"recall":[62],"industrial":[64,132,144],"contexts":[65],"rich":[67,70],"text":[68],"visuals.":[71],"this":[73],"work,":[74],"we":[75,124],"introduce":[76],"simple":[78],"but":[79],"effective":[80],"\\textbf{M}ultimodal":[81],"\\textbf{M}ultilingual":[83],"\\textbf{FORM}":[85],"\\textbf{PARSER}":[86],"(\\textbf{XFormParser}),":[87],"which":[88],"anchored":[89],"on":[90,157,175],"comprehensive":[92],"Transformer-based":[93],"language":[95],"model":[96],"innovatively":[98],"amalgamates":[99],"semantic":[100],"entity":[101],"recognition":[102],"(SER)":[103],"relation":[105],"extraction":[106],"(RE)":[107],"into":[108],"unified":[110],"framework.":[111],"Combined":[112],"with":[113],"Bi-LSTM,":[114],"performance":[116,186],"improved.":[122],"Furthermore,":[123],"develop":[125],"InDFormSFT,":[126],"pioneering":[128],"supervised":[129],"fine-tuning":[130],"(SFT)":[131],"dataset":[133],"that":[134],"specifically":[135],"addresses":[136],"needs":[139],"forms":[141],"various":[143],"contexts.":[145],"XFormParser":[146,166],"has":[147],"demonstrated":[148],"its":[149],"unparalleled":[150],"effectiveness":[151],"robustness":[153],"through":[154],"rigorous":[155],"testing":[156],"established":[158],"benchmarks.":[159],"Compared":[160],"existing":[162],"state-of-the-art":[163],"(SOTA)":[164],"models,":[165],"notably":[167],"achieves":[168],"up":[169],"1.79\\%":[171],"F1":[172],"score":[173],"improvement":[174],"RE":[176],"tasks":[177],"language-specific":[179],"settings.":[180,192],"It":[181],"also":[182],"exhibits":[183],"exceptional":[184],"cross-task":[185],"improvements":[187],"zero-shot":[191],"codes,":[194],"datasets,":[195],"are":[199],"publicly":[200],"available":[201],"at":[202],"https://github.com/zhbuaa0/xformparser.":[203]},"counts_by_year":[],"updated_date":"2026-03-13T16:22:10.518609","created_date":"2024-05-29T00:00:00"}
