{"id":"https://openalex.org/W2044181395","doi":"https://doi.org/10.1109/tcsvt.2014.2305515","title":"Semiautomatic Ground Truth Generation for Text Detection and Recognition in Video Images","display_name":"Semiautomatic Ground Truth Generation for Text Detection and Recognition in Video Images","publication_year":2014,"publication_date":"2014-02-12","ids":{"openalex":"https://openalex.org/W2044181395","doi":"https://doi.org/10.1109/tcsvt.2014.2305515","mag":"2044181395"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2014.2305515","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2014.2305515","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110767730","display_name":"Trung Quy Phan","orcid":null},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Trung Quy Phan","raw_affiliation_strings":["Department of Computer Science, National University of Singapore, Singapore","[Department of Computer ScienceSchool of Computing, National University of Singapore, Singapore]"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]},{"raw_affiliation_string":"[Department of Computer ScienceSchool of Computing, National University of Singapore, Singapore]","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025871978","display_name":"Palaiahnakote Shivakumara","orcid":"https://orcid.org/0000-0001-9026-4613"},"institutions":[{"id":"https://openalex.org/I1323252656","display_name":"Information Technology University","ror":"https://ror.org/00ngv8j44","country_code":"PK","type":"education","lineage":["https://openalex.org/I1323252656"]},{"id":"https://openalex.org/I33849332","display_name":"University of Malaya","ror":"https://ror.org/00rzspn62","country_code":"MY","type":"education","lineage":["https://openalex.org/I33849332"]}],"countries":["MY","PK"],"is_corresponding":false,"raw_author_name":"Palaiahnakote Shivakumara","raw_affiliation_strings":["Department of Computer Systems and Information Technology, University of Malaya, Kuala Lampur, Malaysia","Department of Computer Systems and Information Technology, University of Malaya, Kuala Lampur, Malaysia#TAB#"],"affiliations":[{"raw_affiliation_string":"Department of Computer Systems and Information Technology, University of Malaya, Kuala Lampur, Malaysia","institution_ids":["https://openalex.org/I33849332"]},{"raw_affiliation_string":"Department of Computer Systems and Information Technology, University of Malaya, Kuala Lampur, Malaysia#TAB#","institution_ids":["https://openalex.org/I1323252656"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068862616","display_name":"Souvik Bhowmick","orcid":null},"institutions":[{"id":"https://openalex.org/I6498739","display_name":"Indian Statistical Institute","ror":"https://ror.org/00q2w1j53","country_code":"IN","type":"education","lineage":["https://openalex.org/I6498739"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Souvik Bhowmick","raw_affiliation_strings":["Indian Statistical Institute, Kolkata, India","Indian Statistical Institute  Kolkata India"],"affiliations":[{"raw_affiliation_string":"Indian Statistical Institute, Kolkata, India","institution_ids":["https://openalex.org/I6498739"]},{"raw_affiliation_string":"Indian Statistical Institute  Kolkata India","institution_ids":["https://openalex.org/I6498739"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102833854","display_name":"Shimiao Li","orcid":"https://orcid.org/0000-0002-8744-221X"},"institutions":[{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Shimiao Li","raw_affiliation_strings":["Institute for Infocomm Research (I2R), Singapore","Institute for InfoComm Research (I2R), Singapore"],"affiliations":[{"raw_affiliation_string":"Institute for Infocomm Research (I2R), Singapore","institution_ids":["https://openalex.org/I3005327000"]},{"raw_affiliation_string":"Institute for InfoComm Research (I2R), Singapore","institution_ids":["https://openalex.org/I3005327000"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111664929","display_name":"Chew Lim Tan","orcid":null},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Chew Lim Tan","raw_affiliation_strings":["Department of Computer Science, National University of Singapore, Singapore","[Department of Computer ScienceSchool of Computing, National University of Singapore, Singapore]"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]},{"raw_affiliation_string":"[Department of Computer ScienceSchool of Computing, National University of Singapore, Singapore]","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5068803496","display_name":"Umapada Pal","orcid":"https://orcid.org/0000-0002-5426-2618"},"institutions":[{"id":"https://openalex.org/I6498739","display_name":"Indian Statistical Institute","ror":"https://ror.org/00q2w1j53","country_code":"IN","type":"education","lineage":["https://openalex.org/I6498739"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Umapada Pal","raw_affiliation_strings":["Indian Statistical Institute, Kolkata, India","Indian Statistical Institute  Kolkata India"],"affiliations":[{"raw_affiliation_string":"Indian Statistical Institute, Kolkata, India","institution_ids":["https://openalex.org/I6498739"]},{"raw_affiliation_string":"Indian Statistical Institute  Kolkata India","institution_ids":["https://openalex.org/I6498739"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5110767730"],"corresponding_institution_ids":["https://openalex.org/I165932596"],"apc_list":null,"apc_paid":null,"fwci":0.9755,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.8000315,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"24","issue":"8","first_page":"1277","last_page":"1287"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12707","display_name":"Vehicle License Plate Recognition","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.8244038224220276},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8131605982780457},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6940256953239441},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.6801466941833496},{"id":"https://openalex.org/keywords/distortion","display_name":"Distortion (music)","score":0.6214946508407593},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6040971875190735},{"id":"https://openalex.org/keywords/minimum-bounding-box","display_name":"Minimum bounding box","score":0.5972498655319214},{"id":"https://openalex.org/keywords/text-detection","display_name":"Text detection","score":0.574721097946167},{"id":"https://openalex.org/keywords/orientation","display_name":"Orientation (vector space)","score":0.5563609600067139},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5537291765213013},{"id":"https://openalex.org/keywords/line","display_name":"Line (geometry)","score":0.420657217502594},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.38114017248153687},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.37930700182914734},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.0870937705039978}],"concepts":[{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.8244038224220276},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8131605982780457},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6940256953239441},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.6801466941833496},{"id":"https://openalex.org/C126780896","wikidata":"https://www.wikidata.org/wiki/Q899871","display_name":"Distortion (music)","level":4,"score":0.6214946508407593},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6040971875190735},{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.5972498655319214},{"id":"https://openalex.org/C2983589003","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Text detection","level":3,"score":0.574721097946167},{"id":"https://openalex.org/C16345878","wikidata":"https://www.wikidata.org/wiki/Q107472979","display_name":"Orientation (vector space)","level":2,"score":0.5563609600067139},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5537291765213013},{"id":"https://openalex.org/C198352243","wikidata":"https://www.wikidata.org/wiki/Q37105","display_name":"Line (geometry)","level":2,"score":0.420657217502594},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.38114017248153687},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.37930700182914734},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0870937705039978},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C194257627","wikidata":"https://www.wikidata.org/wiki/Q211554","display_name":"Amplifier","level":3,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2014.2305515","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2014.2305515","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6600000262260437,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G3375617695","display_name":null,"funder_award_id":"092-101-0051","funder_id":"https://openalex.org/F4320320696","funder_display_name":"Agency for Science, Technology and Research"}],"funders":[{"id":"https://openalex.org/F4320320696","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W1497790312","https://openalex.org/W1972065312","https://openalex.org/W1972774730","https://openalex.org/W1979370021","https://openalex.org/W1989327159","https://openalex.org/W1998042868","https://openalex.org/W2005402843","https://openalex.org/W2008806374","https://openalex.org/W2014286161","https://openalex.org/W2016167924","https://openalex.org/W2027883219","https://openalex.org/W2029263174","https://openalex.org/W2034865967","https://openalex.org/W2049574251","https://openalex.org/W2056518953","https://openalex.org/W2061802763","https://openalex.org/W2073152945","https://openalex.org/W2083868436","https://openalex.org/W2094497597","https://openalex.org/W2099063119","https://openalex.org/W2099306567","https://openalex.org/W2117586922","https://openalex.org/W2121839820","https://openalex.org/W2123827229","https://openalex.org/W2130475102","https://openalex.org/W2131447359","https://openalex.org/W2134378185","https://openalex.org/W2137718414","https://openalex.org/W2137969867","https://openalex.org/W2140132917","https://openalex.org/W2141822239","https://openalex.org/W2142082467","https://openalex.org/W2142159465","https://openalex.org/W2142907989","https://openalex.org/W2165569569","https://openalex.org/W2166949156","https://openalex.org/W6642972425","https://openalex.org/W6649973027","https://openalex.org/W6657635057","https://openalex.org/W6681726749","https://openalex.org/W6684363135"],"related_works":["https://openalex.org/W2745033168","https://openalex.org/W3003821897","https://openalex.org/W4235251315","https://openalex.org/W2964561015","https://openalex.org/W2906951608","https://openalex.org/W4200016224","https://openalex.org/W2112430355","https://openalex.org/W2725486421","https://openalex.org/W2781529199","https://openalex.org/W2044181395"],"abstract_inverted_index":{"Although":[0],"a":[1,46,71,138],"large":[2],"number":[3],"of":[4,29,31,65,105,115,119,132,143,188,208],"methods":[5,198],"for":[6,49,53],"video":[7,54,145,155],"text":[8,55,64,116,120,196],"detection":[9,56,197],"and":[10,36,57,62,125,151,170,175,182,203,215],"recognition":[11],"have":[12],"been":[13],"proposed":[14,190],"over":[15],"the":[16,24,75,80,84,95,130,133,186,189,216,223],"past":[17],"years,":[18],"it":[19],"is":[20,192],"hard":[21],"to":[22,73,77,128,205,222],"find":[23],"best":[25],"state-of-the-art":[26],"method":[27,86],"because":[28],"nonavailability":[30],"standard":[32],"datasets,":[33],"ground":[34,50,81,213],"truth,":[35],"common":[37],"evaluation":[38],"measures.":[39],"Therefore,":[40],"in":[41,157],"this":[42],"paper,":[43],"we":[44],"propose":[45,91],"semiautomatic":[47,210,217],"system":[48,69,191,218],"truth":[51,82,214],"generation":[52],"recognition,":[58],"which":[59],"includes":[60],"English":[61,168,181],"Chinese":[63,173],"different":[66],"orientation.":[67],"The":[68,154,212],"has":[70],"facility":[72],"allow":[74],"user":[76],"manually":[78,202],"correct":[79],"if":[83],"automatic":[85],"produces":[87],"incorrect":[88],"results.":[89],"We":[90,135],"eleven":[92],"attributes":[93],"at":[94],"word":[96,101],"level,":[97],"namely:":[98],"line":[99],"index,":[100,102],"coordinate":[103],"values":[104],"bounding":[106],"box,":[107],"area,":[108],"content,":[109],"script":[110],"type,":[111],"orientation":[112],"information,":[113],"type":[114],"(caption/scene),":[117],"condition":[118],"(distortion/distortion":[121],"free),":[122],"start":[123],"frame,":[124],"end":[126],"frame":[127],"evaluate":[129],"performance":[131,187],"method.":[134],"also":[136],"introduce":[137],"new":[139],"dataset":[140,159],"that":[141],"consists":[142],"466":[144],"frames":[146,156],"collected":[147],"from":[148],"TRECVID":[149],"2005":[150],"2006":[152],"databases.":[153],"our":[158,209],"contain":[160],"both":[161],"horizontal":[162],"texts":[163,169,177],"(278":[164],"frames:":[165,179],"181":[166],"with":[167,172,194],"97":[171],"texts)":[174],"nonhorizontal":[176],"(188":[178],"140":[180],"48":[183],"Chinese).":[184],"Furthermore,":[185],"compared":[193],"existing":[195],"by":[199],"calculating":[200],"measures":[201],"automatically":[204],"show":[206],"usefulness":[207],"system.":[211],"will":[219],"be":[220],"released":[221],"public.":[224]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":3},{"year":2014,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
