{"id":"https://openalex.org/W3212251668","doi":"https://doi.org/10.1109/icpr56361.2022.9956120","title":"Information Extraction from Visually Rich Documents with Font Style Embeddings","display_name":"Information Extraction from Visually Rich Documents with Font Style Embeddings","publication_year":2022,"publication_date":"2022-08-21","ids":{"openalex":"https://openalex.org/W3212251668","doi":"https://doi.org/10.1109/icpr56361.2022.9956120","mag":"3212251668"},"language":"en","primary_location":{"id":"doi:10.1109/icpr56361.2022.9956120","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr56361.2022.9956120","pdf_url":null,"source":{"id":"https://openalex.org/S4363607731","display_name":"2022 26th International Conference on Pattern Recognition (ICPR)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 26th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5052770531","display_name":"Ismail Oussaid","orcid":null},"institutions":[{"id":"https://openalex.org/I95549939","display_name":"BNP Paribas (France)","ror":"https://ror.org/02v616z87","country_code":"FR","type":"company","lineage":["https://openalex.org/I95549939"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Ismail Oussaid","raw_affiliation_strings":["BNP Paribas"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"BNP Paribas","institution_ids":["https://openalex.org/I95549939"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030875491","display_name":"William Vanhuffel","orcid":null},"institutions":[{"id":"https://openalex.org/I95549939","display_name":"BNP Paribas (France)","ror":"https://ror.org/02v616z87","country_code":"FR","type":"company","lineage":["https://openalex.org/I95549939"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"William Vanhuffel","raw_affiliation_strings":["BNP Paribas"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"BNP Paribas","institution_ids":["https://openalex.org/I95549939"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046630430","display_name":"Pirashanth Ratnamogan","orcid":null},"institutions":[{"id":"https://openalex.org/I95549939","display_name":"BNP Paribas (France)","ror":"https://ror.org/02v616z87","country_code":"FR","type":"company","lineage":["https://openalex.org/I95549939"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Pirashanth Ratnamogan","raw_affiliation_strings":["BNP Paribas"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"BNP Paribas","institution_ids":["https://openalex.org/I95549939"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039191316","display_name":"Mhamed Hajaiej","orcid":null},"institutions":[{"id":"https://openalex.org/I95549939","display_name":"BNP Paribas (France)","ror":"https://ror.org/02v616z87","country_code":"FR","type":"company","lineage":["https://openalex.org/I95549939"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Mhamed Hajaiej","raw_affiliation_strings":["BNP Paribas"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"BNP Paribas","institution_ids":["https://openalex.org/I95549939"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001719009","display_name":"Alexis Mathey","orcid":null},"institutions":[{"id":"https://openalex.org/I95549939","display_name":"BNP Paribas (France)","ror":"https://ror.org/02v616z87","country_code":"FR","type":"company","lineage":["https://openalex.org/I95549939"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Alexis Mathey","raw_affiliation_strings":["BNP Paribas"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"BNP Paribas","institution_ids":["https://openalex.org/I95549939"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5026727213","display_name":"Thomas Gilles","orcid":"https://orcid.org/0000-0002-5840-1216"},"institutions":[{"id":"https://openalex.org/I95549939","display_name":"BNP Paribas (France)","ror":"https://ror.org/02v616z87","country_code":"FR","type":"company","lineage":["https://openalex.org/I95549939"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Thomas Gilles","raw_affiliation_strings":["BNP Paribas"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"BNP Paribas","institution_ids":["https://openalex.org/I95549939"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.2359,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.55015262,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1657","last_page":"1663"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9939000010490417,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12357","display_name":"Digital Media Forensic Detection","score":0.991100013256073,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.828484058380127},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.7812633514404297},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.7558519840240479},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.669539749622345},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.6634722352027893},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5950213074684143},{"id":"https://openalex.org/keywords/font","display_name":"Font","score":0.5925348997116089},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.5472861528396606},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5236147046089172},{"id":"https://openalex.org/keywords/style","display_name":"Style (visual arts)","score":0.476428359746933},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4309563636779785},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.41260018944740295},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.0834847092628479}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.828484058380127},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.7812633514404297},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.7558519840240479},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.669539749622345},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.6634722352027893},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5950213074684143},{"id":"https://openalex.org/C2777737414","wikidata":"https://www.wikidata.org/wiki/Q4868296","display_name":"Font","level":2,"score":0.5925348997116089},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.5472861528396606},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5236147046089172},{"id":"https://openalex.org/C2776445246","wikidata":"https://www.wikidata.org/wiki/Q1792644","display_name":"Style (visual arts)","level":2,"score":0.476428359746933},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4309563636779785},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.41260018944740295},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0834847092628479},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icpr56361.2022.9956120","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr56361.2022.9956120","pdf_url":null,"source":{"id":"https://openalex.org/S4363607731","display_name":"2022 26th International Conference on Pattern Recognition (ICPR)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 26th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.8299999833106995}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1506666816","https://openalex.org/W1623072288","https://openalex.org/W1901129140","https://openalex.org/W2001642682","https://openalex.org/W2099001231","https://openalex.org/W2143786659","https://openalex.org/W2144578941","https://openalex.org/W2252143212","https://openalex.org/W2891117443","https://openalex.org/W2896457183","https://openalex.org/W2922714365","https://openalex.org/W2951562155","https://openalex.org/W2962772269","https://openalex.org/W2963150697","https://openalex.org/W2963341956","https://openalex.org/W2980282514","https://openalex.org/W2986619406","https://openalex.org/W2998852125","https://openalex.org/W3000758063","https://openalex.org/W3003484198","https://openalex.org/W3010341014","https://openalex.org/W3034997246","https://openalex.org/W3104953317","https://openalex.org/W3132244696","https://openalex.org/W3176851559","https://openalex.org/W3198984549","https://openalex.org/W3202839357","https://openalex.org/W4385245566","https://openalex.org/W6620707391","https://openalex.org/W6630199436","https://openalex.org/W6636392717","https://openalex.org/W6639824700","https://openalex.org/W6739901393","https://openalex.org/W6755207826","https://openalex.org/W6772827613","https://openalex.org/W6784264348","https://openalex.org/W6785897425","https://openalex.org/W6787566904"],"related_works":["https://openalex.org/W2147687867","https://openalex.org/W2582695981","https://openalex.org/W2496907786","https://openalex.org/W2483185727","https://openalex.org/W2612325988","https://openalex.org/W2490611030","https://openalex.org/W3022607756","https://openalex.org/W2043030904","https://openalex.org/W2327192489","https://openalex.org/W2487016776"],"abstract_inverted_index":{"Information":[0],"extraction":[1],"(IE)":[2],"from":[3],"documents":[4,24],"is":[5,85],"an":[6,92,95,121],"intensive":[7],"area":[8],"of":[9,15,42,77,97,107,113,116],"research":[10],"with":[11,25,104],"a":[12,78,105],"large":[13],"set":[14],"industrial":[16],"applications.":[17],"Current":[18],"state-of-the-art":[19],"methods":[20],"focus":[21],"on":[22,63,88],"scanned":[23],"approaches":[26],"combining":[27],"computer":[28,43],"vision,":[29],"natural":[30],"language":[31],"processing":[32],"and":[33,52,126],"layout":[34],"representation.":[35],"We":[36],"propose":[37],"to":[38,99,120],"challenge":[39],"the":[40,46,89,110,117],"usage":[41],"vision":[44],"in":[45,82,101,109,123],"case":[47],"where":[48],"both":[49,124],"token":[50,71],"style":[51,72],"visual":[53,80],"representation":[54],"are":[55],"available":[56],"(i.e":[57],"native":[58],"PDF":[59],"documents).":[60],"Our":[61],"experiments":[62],"three":[64],"real-world":[65],"complex":[66],"datasets":[67],"demonstrate":[68],"that":[69],"using":[70],"attributes":[73],"based":[74],"embedding":[75,81,93],"instead":[76],"raw":[79],"LayoutLM":[83],"model":[84],"beneficial.":[86],"Depending":[87],"dataset,":[90],"such":[91],"yields":[94],"improvement":[96,122],"0.18%":[98],"2.29%":[100],"weighted":[102],"F1-score":[103],"decrease":[106],"30.7%":[108],"final":[111],"number":[112],"trainable":[114],"parameters":[115],"model,":[118],"leading":[119],"efficiency":[125],"effectiveness.":[127]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
