{"id":"https://openalex.org/W2902089218","doi":"https://doi.org/10.1109/icpr.2018.8546073","title":"Page Object Detection from PDF Document Images by Deep Structured Prediction and Supervised Clustering","display_name":"Page Object Detection from PDF Document Images by Deep Structured Prediction and Supervised Clustering","publication_year":2018,"publication_date":"2018-08-01","ids":{"openalex":"https://openalex.org/W2902089218","doi":"https://doi.org/10.1109/icpr.2018.8546073","mag":"2902089218"},"language":"en","primary_location":{"id":"doi:10.1109/icpr.2018.8546073","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr.2018.8546073","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 24th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102885840","display_name":"Xiaohui Li","orcid":"https://orcid.org/0000-0002-0601-1849"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xiao-Hui Li","raw_affiliation_strings":["University of Chinese Academy of Sciences, Beijing, P.R. China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, P.R. 
China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039310938","display_name":"Fei Yin","orcid":"https://orcid.org/0000-0002-6412-9140"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fei Yin","raw_affiliation_strings":["University of Chinese Academy of Sciences, Beijing, P.R. China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, P.R. China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100714202","display_name":"Cheng\u2010Lin Liu","orcid":"https://orcid.org/0000-0002-6743-4175"},"institutions":[{"id":"https://openalex.org/I4210097554","display_name":"Center for Excellence in Brain Science and Intelligence Technology","ror":"https://ror.org/00vpwhm04","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210097554"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cheng-Lin Liu","raw_affiliation_strings":["CAS Center for Excellence of Brain Science and Intelligence Technology, Beijing, P.R. China"],"affiliations":[{"raw_affiliation_string":"CAS Center for Excellence of Brain Science and Intelligence Technology, Beijing, P.R. 
China","institution_ids":["https://openalex.org/I4210097554"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5102885840"],"corresponding_institution_ids":["https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":3.0293,"has_fulltext":false,"cited_by_count":56,"citation_normalized_percentile":{"value":0.93987764,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"3627","last_page":"3632"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval 
Techniques","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/conditional-random-field","display_name":"Conditional random field","score":0.8407989740371704},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7345433235168457},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7276355624198914},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7038292288780212},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6239997744560242},{"id":"https://openalex.org/keywords/crfs","display_name":"CRFS","score":0.5998340249061584},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.5925551652908325},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5673819184303284},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5597230195999146},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5293175578117371},{"id":"https://openalex.org/keywords/pairwise-comparison","display_name":"Pairwise comparison","score":0.5218307375907898},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.34805262088775635},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine 
learning","score":0.3015843629837036}],"concepts":[{"id":"https://openalex.org/C152565575","wikidata":"https://www.wikidata.org/wiki/Q1124538","display_name":"Conditional random field","level":2,"score":0.8407989740371704},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7345433235168457},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7276355624198914},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7038292288780212},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6239997744560242},{"id":"https://openalex.org/C2775953691","wikidata":"https://www.wikidata.org/wiki/Q5013874","display_name":"CRFS","level":3,"score":0.5998340249061584},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.5925551652908325},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5673819184303284},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5597230195999146},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5293175578117371},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.5218307375907898},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data 
mining","level":1,"score":0.34805262088775635},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3015843629837036}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icpr.2018.8546073","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr.2018.8546073","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 24th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320326873","display_name":"National Laboratory of Pattern Recognition","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W167260257","https://openalex.org/W639708223","https://openalex.org/W1956861943","https://openalex.org/W2068113013","https://openalex.org/W2090914336","https://openalex.org/W2122950229","https://openalex.org/W2124189704","https://openalex.org/W2124592697","https://openalex.org/W2131163834","https://openalex.org/W2136451330","https://openalex.org/W2147880316","https://openalex.org/W2169282664","https://openalex.org/W2444353601","https://openalex.org/W2613718673","https://openalex.org/W2785462444","https://openalex.org/W2786162033","https://openalex.org/W2786480153","https://openalex.org/W2787335895","https://openalex.org/W2787371088","https://openalex.org/W2787523828","https://openalex.org/W2787835872","https://openalex.org/W2963037989","https://openalex.org/W3106250896","https://openalex.org/W6620707391","https://openalex.org/W6640794857","https://openalex.org/W6682082992","https://openalex.org/W678
5652829"],"related_works":["https://openalex.org/W2356597680","https://openalex.org/W50079190","https://openalex.org/W182104056","https://openalex.org/W2011251309","https://openalex.org/W2511246383","https://openalex.org/W3108423214","https://openalex.org/W2796133761","https://openalex.org/W3088215229","https://openalex.org/W2184553228","https://openalex.org/W2390846138"],"abstract_inverted_index":{"Page":[0],"object":[1,22],"detection":[2],"in":[3,15,49],"document":[4,51],"images":[5,52],"remains":[6],"a":[7,33,54,128,133],"challenge":[8],"because":[9],"the":[10,87,112,121,141,149,154],"page":[11,134],"objects":[12],"are":[13,66,94,130],"diverse":[14],"scale":[16],"and":[17,20,40,47,68,83,89,151],"aspect":[18],"ratio,":[19],"an":[21],"may":[23],"contain":[24],"largely":[25],"apart":[26],"components.":[27],"In":[28],"this":[29],"paper,":[30],"we":[31],"propose":[32],"hybrid":[34],"method":[35],"combining":[36],"deep":[37],"structured":[38],"prediction":[39],"supervised":[41],"clustering":[42,110],"to":[43,101],"detect":[44],"formulas,":[45],"tables":[46],"figures":[48],"PDF":[50],"within":[53,127],"unified":[55],"framework.":[56],"The":[57,107,136],"primitive":[58],"region":[59,65],"proposals":[60],"extracted":[61],"from":[62],"each":[63],"column":[64],"classified":[67],"clustered":[69],"with":[70],"conditional":[71],"random":[72],"field":[73],"(CRF)":[74],"based":[75],"graphical":[76],"models":[77],"which":[78],"can":[79],"integrate":[80],"both":[81],"local":[82],"contextual":[84,105],"information.":[85,106],"Both":[86],"unary":[88],"pairwise":[90],"potentials":[91],"of":[92,115,124,153],"CRFs":[93],"formulated":[95],"as":[96],"convolutional":[97],"neural":[98],"networks":[99],"(CNNs)":[100],"better":[102],"exploit":[103],"spatial":[104],"CRF":[108,119],"for":[109],"predicts":[111],"linked/cut":[113],"label":[114],"between-region":[116],"links.":[117],"After":[118],"inference,":[120],"line":[122],"regions":[123],"same":[125],"class":[126],"cluster":[129],"grouped":
[131],"into":[132],"object.":[135],"state-of-the-art":[137],"performance":[138],"obtained":[139],"on":[140],"public":[142],"available":[143],"ICDAR2017":[144],"POD":[145],"competition":[146],"dataset":[147],"demonstrates":[148],"effectiveness":[150],"superiority":[152],"proposed":[155],"method.":[156]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":9},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":19},{"year":2020,"cited_by_count":7},{"year":2019,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
