{"id":"https://openalex.org/W4414253292","doi":"https://doi.org/10.1007/978-3-032-04624-6_13","title":"HisDoc-DETR: Integrating Semantic Learning and\u00a0Feature Fusion for\u00a0Historical Document Layout Analysis","display_name":"HisDoc-DETR: Integrating Semantic Learning and\u00a0Feature Fusion for\u00a0Historical Document Layout Analysis","publication_year":2025,"publication_date":"2025-09-16","ids":{"openalex":"https://openalex.org/W4414253292","doi":"https://doi.org/10.1007/978-3-032-04624-6_13"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-032-04624-6_13","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-032-04624-6_13","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101873754","display_name":"Kai Ding","orcid":"https://orcid.org/0000-0002-4214-1923"},"institutions":[{"id":"https://openalex.org/I4210166174","display_name":"Joint Research Center","ror":"https://ror.org/05a4nj078","country_code":"ES","type":"government","lineage":["https://openalex.org/I1320481043","https://openalex.org/I2800387288","https://openalex.org/I4210161702","https://openalex.org/I4210166174"]}],"countries":["ES"],"is_corresponding":true,"raw_author_name":"Kai Ding","raw_affiliation_strings":["INTSIG-SCUT Joint Lab on Document Analysis and Recognition, Shanghai, China","IntSig Information Co., Ltd, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"INTSIG-SCUT Joint Lab on Document Analysis and Recognition, Shanghai, China","institution_ids":["https://openalex.org/I4210166174"]},{"raw_affiliation_string":"IntSig Information Co., Ltd, Shanghai, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000818862","display_name":"Sheng\u2010Rui Jian","orcid":"https://orcid.org/0000-0003-4925-5832"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sheng Jian","raw_affiliation_strings":["South China University of Technology, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5080674767","display_name":"Lianwen Jin","orcid":"https://orcid.org/0000-0002-5456-0957"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]},{"id":"https://openalex.org/I4210166174","display_name":"Joint Research Center","ror":"https://ror.org/05a4nj078","country_code":"ES","type":"government","lineage":["https://openalex.org/I1320481043","https://openalex.org/I2800387288","https://openalex.org/I4210161702","https://openalex.org/I4210166174"]}],"countries":["CN","ES"],"is_corresponding":false,"raw_author_name":"Lianwen Jin","raw_affiliation_strings":["INTSIG-SCUT Joint Lab on Document Analysis and Recognition, Shanghai, China","South China University of Technology, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"INTSIG-SCUT Joint Lab on Document Analysis and Recognition, Shanghai, China","institution_ids":["https://openalex.org/I4210166174"]},{"raw_affiliation_string":"South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5101873754"],"corresponding_institution_ids":["https://openalex.org/I4210166174"],"apc_list":{"value":5000,"currency":"EUR","value_usd":5392},"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.55847255,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"218","last_page":"237"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9822999835014343,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/document-layout-analysis","display_name":"Document layout analysis","score":0.5782999992370605},{"id":"https://openalex.org/keywords/historical-document","display_name":"Historical document","score":0.5267999768257141},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5192999839782715},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4885999858379364},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4796000123023987},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4564000070095062},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.3910999894142151},{"id":"https://openalex.org/keywords/document-processing","display_name":"Document processing","score":0.3481000065803528}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8970999717712402},{"id":"https://openalex.org/C72773152","wikidata":"https://www.wikidata.org/wiki/Q5287629","display_name":"Document layout analysis","level":3,"score":0.5782999992370605},{"id":"https://openalex.org/C2778371909","wikidata":"https://www.wikidata.org/wiki/Q3771738","display_name":"Historical document","level":2,"score":0.5267999768257141},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5192999839782715},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4885999858379364},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4869000017642975},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4796000123023987},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4564000070095062},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.41769999265670776},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.3910999894142151},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.36629998683929443},{"id":"https://openalex.org/C67905146","wikidata":"https://www.wikidata.org/wiki/Q5287646","display_name":"Document processing","level":2,"score":0.3481000065803528},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3425999879837036},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.31769999861717224},{"id":"https://openalex.org/C2777946921","wikidata":"https://www.wikidata.org/wiki/Q7449044","display_name":"Semantic analysis (machine learning)","level":2,"score":0.31119999289512634},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3070000112056732},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2888999879360199},{"id":"https://openalex.org/C85407183","wikidata":"https://www.wikidata.org/wiki/Q1045785","display_name":"Semantic network","level":2,"score":0.2879999876022339},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.2840999960899353},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.26019999384880066},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.25929999351501465},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2540999948978424},{"id":"https://openalex.org/C188985296","wikidata":"https://www.wikidata.org/wiki/Q868954","display_name":"Page layout","level":2,"score":0.25099998712539673}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/978-3-032-04624-6_13","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-032-04624-6_13","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1989324344","https://openalex.org/W2055408294","https://openalex.org/W2108959246","https://openalex.org/W2110224595","https://openalex.org/W2120233736","https://openalex.org/W2128060444","https://openalex.org/W2129265797","https://openalex.org/W2135164809","https://openalex.org/W2139970276","https://openalex.org/W2169402356","https://openalex.org/W2565639579","https://openalex.org/W2798826627","https://openalex.org/W2808606449","https://openalex.org/W2962721361","https://openalex.org/W2962834855","https://openalex.org/W2963037989","https://openalex.org/W2963150697","https://openalex.org/W2963351448","https://openalex.org/W2963857746","https://openalex.org/W2964241181","https://openalex.org/W2964346820","https://openalex.org/W2964444661","https://openalex.org/W2970042171","https://openalex.org/W2982770724","https://openalex.org/W2987322772","https://openalex.org/W3034552520","https://openalex.org/W3171660447","https://openalex.org/W3177052299","https://openalex.org/W3186327500","https://openalex.org/W3199093552","https://openalex.org/W3201871940","https://openalex.org/W4214627427","https://openalex.org/W4288064931","https://openalex.org/W4304013646","https://openalex.org/W4304014014","https://openalex.org/W4312312588","https://openalex.org/W4313161517","https://openalex.org/W4319301068","https://openalex.org/W4385990930","https://openalex.org/W4385991153","https://openalex.org/W4386008071","https://openalex.org/W4386065740","https://openalex.org/W4386083123","https://openalex.org/W4390871882","https://openalex.org/W4390872501","https://openalex.org/W4390873840"],"related_works":[],"abstract_inverted_index":null,"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
