{"id":"https://openalex.org/W3163476226","doi":"https://doi.org/10.1109/icpr48806.2021.9412557","title":"Vision-Based Layout Detection from Scientific Literature using Recurrent Convolutional Neural Networks","display_name":"Vision-Based Layout Detection from Scientific Literature using Recurrent Convolutional Neural Networks","publication_year":2021,"publication_date":"2021-01-10","ids":{"openalex":"https://openalex.org/W3163476226","doi":"https://doi.org/10.1109/icpr48806.2021.9412557","mag":"3163476226"},"language":"en","primary_location":{"id":"doi:10.1109/icpr48806.2021.9412557","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr48806.2021.9412557","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 25th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109217666","display_name":"Huichen Yang","orcid":"https://orcid.org/0009-0003-8344-9566"},"institutions":[{"id":"https://openalex.org/I189590672","display_name":"Kansas State University","ror":"https://ror.org/05p1j8758","country_code":"US","type":"education","lineage":["https://openalex.org/I189590672"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Huichen Yang","raw_affiliation_strings":["Kansas State University, Manhattan, Kansas, USA"],"affiliations":[{"raw_affiliation_string":"Kansas State University, Manhattan, Kansas, USA","institution_ids":["https://openalex.org/I189590672"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103860152","display_name":"William H. Hsu","orcid":null},"institutions":[{"id":"https://openalex.org/I189590672","display_name":"Kansas State University","ror":"https://ror.org/05p1j8758","country_code":"US","type":"education","lineage":["https://openalex.org/I189590672"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"William H. Hsu","raw_affiliation_strings":["Kansas State University, Manhattan, Kansas, USA"],"affiliations":[{"raw_affiliation_string":"Kansas State University, Manhattan, Kansas, USA","institution_ids":["https://openalex.org/I189590672"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5109217666"],"corresponding_institution_ids":["https://openalex.org/I189590672"],"apc_list":null,"apc_paid":null,"fwci":1.7483,"has_fulltext":false,"cited_by_count":24,"citation_normalized_percentile":{"value":0.86626356,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"6455","last_page":"6462"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.991599977016449,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8393818736076355},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.7871774435043335},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5954188108444214},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5912621021270752},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5853046178817749},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.528478741645813},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5079289078712463},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.49904537200927734},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.4825519919395447},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4821152687072754},{"id":"https://openalex.org/keywords/test-set","display_name":"Test set","score":0.47961270809173584},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.46804285049438477},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4494308829307556},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.4444672763347626},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4371919333934784},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.4131668210029602},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3343045711517334}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8393818736076355},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.7871774435043335},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5954188108444214},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5912621021270752},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5853046178817749},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.528478741645813},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5079289078712463},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.49904537200927734},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.4825519919395447},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4821152687072754},{"id":"https://openalex.org/C169903167","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Test set","level":2,"score":0.47961270809173584},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.46804285049438477},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4494308829307556},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.4444672763347626},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4371919333934784},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.4131668210029602},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3343045711517334},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icpr48806.2021.9412557","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr48806.2021.9412557","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 25th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.6700000166893005}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W155850152","https://openalex.org/W791527587","https://openalex.org/W1536680647","https://openalex.org/W1861492603","https://openalex.org/W1901129140","https://openalex.org/W1964101267","https://openalex.org/W1976072260","https://openalex.org/W2022351003","https://openalex.org/W2079525773","https://openalex.org/W2091171890","https://openalex.org/W2126925189","https://openalex.org/W2133713322","https://openalex.org/W2163113711","https://openalex.org/W2166633748","https://openalex.org/W2194775991","https://openalex.org/W2526468814","https://openalex.org/W2565639579","https://openalex.org/W2570343428","https://openalex.org/W2766362701","https://openalex.org/W2769316437","https://openalex.org/W2786480153","https://openalex.org/W2787480186","https://openalex.org/W2902089218","https://openalex.org/W2937176418","https://openalex.org/W2953106684","https://openalex.org/W2963446712","https://openalex.org/W2964346820","https://openalex.org/W2970042171","https://openalex.org/W2970987838","https://openalex.org/W2980913015","https://openalex.org/W2989445916","https://openalex.org/W3003334191","https://openalex.org/W3035049382","https://openalex.org/W3105988348","https://openalex.org/W4293584584","https://openalex.org/W6606377508","https://openalex.org/W6620707391","https://openalex.org/W6639102338","https://openalex.org/W6639824700"],"related_works":["https://openalex.org/W3183901164","https://openalex.org/W3135818718","https://openalex.org/W4290188444","https://openalex.org/W3176438653","https://openalex.org/W3167935049","https://openalex.org/W3003905048","https://openalex.org/W2253429366","https://openalex.org/W3127975138","https://openalex.org/W2969228573","https://openalex.org/W3131692135"],"abstract_inverted_index":{"We":[0,94],"present":[1,74],"an":[2,43,80,101],"approach":[3,77],"for":[4,9,148,156,167,180],"adapting":[5],"convolutional":[6,207],"neural":[7,208],"networks":[8,137],"object":[10,102],"recognition":[11],"and":[12,46,53,86,138],"classification":[13],"to":[14,61,66,78,84,115,129,204],"scientific":[15,92,96,181],"literature":[16],"layout":[17,98,183],"detection":[18,103,184],"(SLLD),":[19],"a":[20,75,91,175,194],"shared":[21],"subtask":[22],"of":[23,33,90,135,162,170,193],"several":[24],"information":[25,34,64],"extraction":[26],"problems.":[27],"Scientific":[28],"publications":[29],"contain":[30],"multiple":[31],"types":[32],"sought":[35],"by":[36],"researchers":[37],"in":[38],"various":[39],"disciplines,":[40],"organized":[41],"into":[42,118],"abstract,":[44],"bibliography,":[45],"sections":[47],"documenting":[48],"related":[49],"work,":[50],"experimental":[51,164],"methods,":[52],"results;":[54],"however,":[55],"there":[56],"is":[57,128,146],"no":[58],"effective":[59],"way":[60],"extract":[62],"this":[63,71,142,171,199],"due":[65],"their":[67],"diverse":[68],"layout.":[69],"In":[70],"paper,":[72],"we":[73,173],"novel":[76],"developing":[79],"end-to-end":[81],"learning":[82,132,144],"framework":[83],"segment":[85],"classify":[87],"major":[88],"regions":[89],"document.":[93],"consider":[95],"document":[97,154],"analysis":[99],"as":[100],"task":[104],"over":[105],"digital":[106],"images,":[107],"without":[108],"any":[109],"additional":[110],"text":[111],"features":[112],"that":[113,141,150],"need":[114],"be":[116],"added":[117],"the":[119,122,163,205],"network":[120,197,209],"during":[121],"training":[123,157],"process.":[124],"Our":[125,186],"technical":[126],"objective":[127],"implement":[130],"transfer":[131],"via":[133],"fine-tuning":[134,192],"pre-trained":[136,195],"thereby":[139],"demonstrate":[140],"deep":[143],"architecture":[145],"suitable":[147],"tasks":[149],"lack":[151],"very":[152],"large":[153],"corpora":[155],"ab":[158],"initio.":[159],"As":[160],"part":[161],"test":[165],"bed":[166],"empirical":[168],"evaluation":[169],"approach,":[172],"created":[174],"merged":[176,200],"multi-corpus":[177],"data":[178,201],"set":[179],"publication":[182],"tasks.":[185],"results":[187],"show":[188],"good":[189],"improvement":[190],"with":[191],"base":[196],"using":[198],"set,":[202],"compared":[203],"baseline":[206],"architecture.":[210]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":1}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
