{"id":"https://openalex.org/W1967245533","doi":"https://doi.org/10.1117/12.2039492","title":"Document page structure learning for fixed-layout e-books using conditional random fields","display_name":"Document page structure learning for fixed-layout e-books using conditional random fields","publication_year":2013,"publication_date":"2013-12-27","ids":{"openalex":"https://openalex.org/W1967245533","doi":"https://doi.org/10.1117/12.2039492","mag":"1967245533"},"language":"en","primary_location":{"id":"doi:10.1117/12.2039492","is_oa":false,"landing_page_url":"https://doi.org/10.1117/12.2039492","pdf_url":null,"source":{"id":"https://openalex.org/S183492911","display_name":"Proceedings of SPIE, the International Society for Optical Engineering/Proceedings of SPIE","issn_l":"0277-786X","issn":["0277-786X","1996-756X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310315543","host_organization_name":"SPIE","host_organization_lineage":["https://openalex.org/P4310315543"],"host_organization_lineage_names":["SPIE"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"SPIE Proceedings","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100624769","display_name":"Xin Tao","orcid":"https://orcid.org/0000-0002-5107-9068"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xin Tao","raw_affiliation_strings":["Peking Univ. (China)"],"affiliations":[{"raw_affiliation_string":"Peking Univ. (China)","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103175239","display_name":"Zhi Tang","orcid":"https://orcid.org/0000-0002-6021-8357"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]},{"id":"https://openalex.org/I4391767988","display_name":"State Key Laboratory of Digital Publishing Technology","ror":"https://ror.org/021s6g098","country_code":null,"type":"facility","lineage":["https://openalex.org/I20231570","https://openalex.org/I4391767988"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhi Tang","raw_affiliation_strings":["Peking Univ. (China)","State Key Lab. of Digital Publishing Technology (China)"],"affiliations":[{"raw_affiliation_string":"Peking Univ. (China)","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"State Key Lab. of Digital Publishing Technology (China)","institution_ids":["https://openalex.org/I4391767988"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5084189725","display_name":"Canhui Xu","orcid":"https://orcid.org/0000-0002-9907-6747"},"institutions":[{"id":"https://openalex.org/I4391767988","display_name":"State Key Laboratory of Digital Publishing Technology","ror":"https://ror.org/021s6g098","country_code":null,"type":"facility","lineage":["https://openalex.org/I20231570","https://openalex.org/I4391767988"]},{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Canhui Xu","raw_affiliation_strings":["Peking Univ. (China)","State Key Lab. of Digital Publishing Technology (China)"],"affiliations":[{"raw_affiliation_string":"Peking Univ. (China)","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"State Key Lab. of Digital Publishing Technology (China)","institution_ids":["https://openalex.org/I4391767988"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100624769"],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.05424956,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"9021","issue":null,"first_page":"90210I","last_page":"90210I"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9896000027656555,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/conditional-random-field","display_name":"Conditional random field","score":0.9018906354904175},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.8094302415847778},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.73935866355896},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.6353448629379272},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6166824698448181},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.536742627620697},{"id":"https://openalex.org/keywords/macro","display_name":"Macro","score":0.49395495653152466},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.46440744400024414},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4587964713573456},{"id":"https://openalex.org/keywords/tree-structure","display_name":"Tree structure","score":0.4550500810146332},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.40378955006599426},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3943207859992981},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3807445764541626},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.2861655354499817},{"id":"https://openalex.org/keywords/binary-tree","display_name":"Binary tree","score":0.2559252679347992},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.15243670344352722}],"concepts":[{"id":"https://openalex.org/C152565575","wikidata":"https://www.wikidata.org/wiki/Q1124538","display_name":"Conditional random field","level":2,"score":0.9018906354904175},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.8094302415847778},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.73935866355896},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.6353448629379272},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6166824698448181},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.536742627620697},{"id":"https://openalex.org/C166955791","wikidata":"https://www.wikidata.org/wiki/Q629579","display_name":"Macro","level":2,"score":0.49395495653152466},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.46440744400024414},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4587964713573456},{"id":"https://openalex.org/C163797641","wikidata":"https://www.wikidata.org/wiki/Q2067937","display_name":"Tree structure","level":3,"score":0.4550500810146332},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.40378955006599426},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3943207859992981},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3807445764541626},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2861655354499817},{"id":"https://openalex.org/C197855036","wikidata":"https://www.wikidata.org/wiki/Q380172","display_name":"Binary tree","level":2,"score":0.2559252679347992},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.15243670344352722},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1117/12.2039492","is_oa":false,"landing_page_url":"https://doi.org/10.1117/12.2039492","pdf_url":null,"source":{"id":"https://openalex.org/S183492911","display_name":"Proceedings of SPIE, the International Society for Optical Engineering/Proceedings of SPIE","issn_l":"0277-786X","issn":["0277-786X","1996-756X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310315543","host_organization_name":"SPIE","host_organization_lineage":["https://openalex.org/P4310315543"],"host_organization_lineage_names":["SPIE"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"SPIE Proceedings","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.7699999809265137,"display_name":"Reduced inequalities"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W44597921","https://openalex.org/W1618905105","https://openalex.org/W1981791873","https://openalex.org/W1989491834","https://openalex.org/W1998795455","https://openalex.org/W2002399343","https://openalex.org/W2005777475","https://openalex.org/W2016485096","https://openalex.org/W2047334181","https://openalex.org/W2048458520","https://openalex.org/W2051434435","https://openalex.org/W2062843843","https://openalex.org/W2077079264","https://openalex.org/W2100735443","https://openalex.org/W2133251346","https://openalex.org/W2140479099","https://openalex.org/W2144777592","https://openalex.org/W2162267467","https://openalex.org/W2505790104","https://openalex.org/W3144833350","https://openalex.org/W4237385507","https://openalex.org/W4253723135","https://openalex.org/W6636501900","https://openalex.org/W6650686273","https://openalex.org/W6654257724"],"related_works":["https://openalex.org/W2965546495","https://openalex.org/W4389116644","https://openalex.org/W2153315159","https://openalex.org/W2356597680","https://openalex.org/W3103844505","https://openalex.org/W2030816003","https://openalex.org/W2163278254","https://openalex.org/W155708904","https://openalex.org/W1574213390","https://openalex.org/W1487808658"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"a":[3],"model":[4,56,110],"is":[5,83],"proposed":[6,55],"to":[7,28,59],"learn":[8],"logical":[9,30,62],"structure":[10],"of":[11,68,79,85,89,114],"fixed-layout":[12],"document":[13],"pages":[14],"by":[15,117],"combining":[16],"support":[17],"vector":[18],"machine":[19],"(SVM)":[20],"and":[21,32,48,74,103],"conditional":[22],"random":[23],"fields":[24],"(CRF).":[25],"Features":[26],"related":[27],"each":[29],"label":[31],"their":[33],"dependencies":[34,50],"are":[35,51],"extracted":[36],"from":[37],"various":[38],"original":[39],"Portable":[40],"Document":[41],"Format":[42],"(PDF)":[43],"attributes.":[44],"Both":[45],"local":[46,71],"evidence":[47],"contextual":[49,77],"integrated":[52],"in":[53],"the":[54,66,87,108],"so":[57],"as":[58,70],"achieve":[60],"better":[61],"labeling":[63],"performance.":[64],"With":[65],"merits":[67],"SVM":[69,109],"discriminative":[72],"classifier":[73],"CRF":[75,97],"modeling":[76],"correlations":[78],"adjacent":[80],"fragments,":[81],"it":[82],"capable":[84],"resolving":[86],"ambiguities":[88],"semantic":[90],"labels.":[91],"The":[92],"experimental":[93],"results":[94],"show":[95],"that":[96],"based":[98],"models":[99],"with":[100,111],"both":[101],"tree":[102],"chain":[104],"graph":[105],"structures":[106],"outperform":[107],"an":[112],"increase":[113],"macro-averaged":[115],"F<sub>1</sub>":[116],"about":[118],"10%.":[119]},"counts_by_year":[{"year":2017,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
