{"id":"https://openalex.org/W2606911419","doi":"https://doi.org/10.1109/tip.2017.2695104","title":"Tracking Based Multi-Orientation Scene Text Detection: A Unified Framework With Dynamic Programming","display_name":"Tracking Based Multi-Orientation Scene Text Detection: A Unified Framework With Dynamic Programming","publication_year":2017,"publication_date":"2017-04-18","ids":{"openalex":"https://openalex.org/W2606911419","doi":"https://doi.org/10.1109/tip.2017.2695104","mag":"2606911419","pmid":"https://pubmed.ncbi.nlm.nih.gov/28436864"},"language":"en","primary_location":{"id":"doi:10.1109/tip.2017.2695104","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2017.2695104","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015252816","display_name":"Chun Yang","orcid":"https://orcid.org/0000-0002-6297-4500"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chun Yang","raw_affiliation_strings":["Department of Computer Science and Technology, University of Science and Technology Beijing, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074514262","display_name":"Xu-Cheng Yin","orcid":"https://orcid.org/0000-0003-0023-0220"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xu-Cheng Yin","raw_affiliation_strings":["Beijing Key Laboratory of Materials Science Knowledge Engineering, School of Computer and Communication Engineering, University of Science and Technology Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-0023-0220","affiliations":[{"raw_affiliation_string":"Beijing Key Laboratory of Materials Science Knowledge Engineering, School of Computer and Communication Engineering, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070967152","display_name":"Wei-Yi Pei","orcid":null},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei-Yi Pei","raw_affiliation_strings":["Department of Computer Science and Technology, University of Science and Technology Beijing, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012986058","display_name":"Shu Tian","orcid":"https://orcid.org/0000-0002-4910-6071"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shu Tian","raw_affiliation_strings":["Department of Computer Science and Technology, University of Science and Technology Beijing, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017450226","display_name":"Ze-Yu Zuo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ze-Yu Zuo","raw_affiliation_strings":["weibo.com, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"weibo.com, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101989915","display_name":"Chao Zhu","orcid":"https://orcid.org/0000-0001-5486-7492"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chao Zhu","raw_affiliation_strings":["Department of Computer Science and Technology, University of Science and Technology Beijing, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5087158377","display_name":"Junchi Yan","orcid":"https://orcid.org/0000-0001-9639-7679"},"institutions":[{"id":"https://openalex.org/I4210126794","display_name":"IBM Research (China)","ror":"https://ror.org/02yg1pf55","country_code":"CN","type":"company","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115","https://openalex.org/I4210126794"]},{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junchi Yan","raw_affiliation_strings":["Department of Computer Science and Technology, East China Normal University, Shanghai, China","IBM China Research Center, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0001-9639-7679","affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, East China Normal University, Shanghai, China","institution_ids":["https://openalex.org/I66867065"]},{"raw_affiliation_string":"IBM China Research Center, Shanghai, China","institution_ids":["https://openalex.org/I4210126794"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5015252816"],"corresponding_institution_ids":["https://openalex.org/I92403157"],"apc_list":null,"apc_paid":null,"fwci":2.6809,"has_fulltext":false,"cited_by_count":49,"citation_normalized_percentile":{"value":0.94298412,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":"26","issue":"7","first_page":"3235","last_page":"3248"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12707","display_name":"Vehicle License Plate Recognition","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.814106822013855},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8086718916893005},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.7223882079124451},{"id":"https://openalex.org/keywords/orientation","display_name":"Orientation (vector space)","score":0.7001180648803711},{"id":"https://openalex.org/keywords/dynamic-programming","display_name":"Dynamic programming","score":0.5794373750686646},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.5092350244522095},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.5087316632270813},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.4840937852859497},{"id":"https://openalex.org/keywords/distortion","display_name":"Distortion (music)","score":0.47571995854377747},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.44307368993759155},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.42068442702293396},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.17352071404457092},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.0886874794960022}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.814106822013855},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8086718916893005},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7223882079124451},{"id":"https://openalex.org/C16345878","wikidata":"https://www.wikidata.org/wiki/Q107472979","display_name":"Orientation (vector space)","level":2,"score":0.7001180648803711},{"id":"https://openalex.org/C37404715","wikidata":"https://www.wikidata.org/wiki/Q380679","display_name":"Dynamic programming","level":2,"score":0.5794373750686646},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.5092350244522095},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.5087316632270813},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.4840937852859497},{"id":"https://openalex.org/C126780896","wikidata":"https://www.wikidata.org/wiki/Q899871","display_name":"Distortion (music)","level":4,"score":0.47571995854377747},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.44307368993759155},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.42068442702293396},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.17352071404457092},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0886874794960022},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0},{"id":"https://openalex.org/C194257627","wikidata":"https://www.wikidata.org/wiki/Q211554","display_name":"Amplifier","level":3,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tip.2017.2695104","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2017.2695104","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},{"id":"pmid:28436864","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/28436864","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on image processing : a publication of the IEEE Signal Processing Society","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.7699999809265137}],"awards":[{"id":"https://openalex.org/G1153650145","display_name":null,"funder_award_id":"61473036","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":71,"referenced_works":["https://openalex.org/W29474918","https://openalex.org/W117491841","https://openalex.org/W618799001","https://openalex.org/W1493331862","https://openalex.org/W1547848520","https://openalex.org/W1569095176","https://openalex.org/W1607307044","https://openalex.org/W1649469042","https://openalex.org/W1922126009","https://openalex.org/W1935817682","https://openalex.org/W1971822075","https://openalex.org/W1972065312","https://openalex.org/W1972730516","https://openalex.org/W1978854150","https://openalex.org/W1986965125","https://openalex.org/W1988461287","https://openalex.org/W1992257524","https://openalex.org/W1995052126","https://openalex.org/W1998384060","https://openalex.org/W1999284580","https://openalex.org/W2004681979","https://openalex.org/W2005720384","https://openalex.org/W2019478948","https://openalex.org/W2056435187","https://openalex.org/W2058114646","https://openalex.org/W2060560731","https://openalex.org/W2061802763","https://openalex.org/W2065613686","https://openalex.org/W2071267894","https://openalex.org/W2100396823","https://openalex.org/W2107244081","https://openalex.org/W2124404372","https://openalex.org/W2128854450","https://openalex.org/W2131163834","https://openalex.org/W2131605657","https://openalex.org/W2135231474","https://openalex.org/W2138900418","https://openalex.org/W2142159465","https://openalex.org/W2144554289","https://openalex.org/W2147237076","https://openalex.org/W2148214126","https://openalex.org/W2148819429","https://openalex.org/W2150953273","https://openalex.org/W2153624852","https://openalex.org/W2158061724","https://openalex.org/W2158878654","https://openalex.org/W2159072271","https://openalex.org/W2159374016","https://openalex.org/W2161073567","https://openalex.org/W2163605009","https://openalex.org/W2163876554","https://openalex.org/W2163914840","https://openalex.org/W2165569569","https://openalex.org/W2166274584","https://openalex.org/W2217433794","https://openalex.org/W2288265821","https://openalex.org/W2340583188","https://openalex.org/W2343841668","https://openalex.org/W2369976370","https://openalex.org/W2555860637","https://openalex.org/W2572373566","https://openalex.org/W2606394513","https://openalex.org/W2618530766","https://openalex.org/W4253115048","https://openalex.org/W6604768502","https://openalex.org/W6632893558","https://openalex.org/W6636382570","https://openalex.org/W6642972425","https://openalex.org/W6679510917","https://openalex.org/W6684191040","https://openalex.org/W6731801012"],"related_works":["https://openalex.org/W2328889547","https://openalex.org/W3003858543","https://openalex.org/W1969547578","https://openalex.org/W4312306082","https://openalex.org/W2171488351","https://openalex.org/W2378029901","https://openalex.org/W3023793255","https://openalex.org/W2393063995","https://openalex.org/W2358848605","https://openalex.org/W2965594636"],"abstract_inverted_index":{"There":[0],"are":[1],"a":[2,43,56,63],"variety":[3],"of":[4,122,137],"grand":[5],"challenges":[6],"for":[7],"multi-orientation":[8,47,66,138],"text":[9,29,49,67,83,140],"detection":[10,30,50,68,110],"in":[11,70],"scene":[12,48,139],"videos,":[13,143],"where":[14],"the":[15,109,120,129],"typical":[16],"issues":[17],"include":[18],"skew":[19],"distortion,":[20],"low":[21],"contrast,":[22],"and":[23,81,88,97,116,142,147],"arbitrary":[24],"motion.":[25],"Most":[26],"conventional":[27],"video":[28],"methods":[31],"using":[32,52],"individual":[33],"frames":[34,54,102],"have":[35],"limited":[36],"performance.":[37],"In":[38],"this":[39],"paper,":[40],"we":[41],"propose":[42],"novel":[44],"tracking":[45,93],"based":[46],"method":[51,69],"multiple":[53,86],"within":[55],"unified":[57],"framework":[58],"via":[59],"dynamic":[60,104],"programming.":[61],"First,":[62],"multi-information":[64],"fusion-based":[65],"each":[71],"frame":[72],"is":[73,95,126],"proposed":[74,124],"to":[75,106],"extensively":[76],"locate":[77],"possible":[78],"character":[79],"candidates":[80],"extract":[82],"regions":[84],"with":[85,112,128],"channels":[87],"scales.":[89],"Second,":[90],"an":[91],"optimal":[92],"trajectory":[94],"learned":[96],"linked":[98],"globally":[99],"over":[100],"consecutive":[101],"by":[103],"programming":[105],"finally":[107],"refine":[108],"results":[111],"all":[113],"detection,":[114],"recognition,":[115],"prediction":[117],"information.":[118],"Moreover,":[119],"effectiveness":[121],"our":[123],"system":[125],"evaluated":[127],"state-of-the-art":[130],"performances":[131],"on":[132],"several":[133],"public":[134],"data":[135],"sets":[136],"images":[141],"including":[144],"MSRA-TD500,":[145],"USTB-SV1K,":[146],"ICDAR":[148],"2015":[149],"Scene":[150],"Videos.":[151]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":7},{"year":2020,"cited_by_count":14},{"year":2019,"cited_by_count":7},{"year":2018,"cited_by_count":6},{"year":2017,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
