{"id":"https://openalex.org/W2964631447","doi":"https://doi.org/10.1109/wacv45572.2020.9093534","title":"It\u2019s All About The Scale - Efficient Text Detection Using Adaptive Scaling","display_name":"It\u2019s All About The Scale - Efficient Text Detection Using Adaptive Scaling","publication_year":2020,"publication_date":"2020-03-01","ids":{"openalex":"https://openalex.org/W2964631447","doi":"https://doi.org/10.1109/wacv45572.2020.9093534","mag":"2964631447"},"language":"en","primary_location":{"id":"doi:10.1109/wacv45572.2020.9093534","is_oa":false,"landing_page_url":"https://doi.org/10.1109/wacv45572.2020.9093534","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE Winter Conference on Applications of Computer Vision (WACV)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1907.12122","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016129501","display_name":"Elad Richardson","orcid":"https://orcid.org/0009-0002-1784-3736"},"institutions":[{"id":"https://openalex.org/I4210132147","display_name":"Penta-Ocean Construction (Japan)","ror":"https://ror.org/03zedkf25","country_code":"JP","type":"company","lineage":["https://openalex.org/I4210132147"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Elad Richardson","raw_affiliation_strings":["Penta-AI"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Penta-AI","institution_ids":["https://openalex.org/I4210132147"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034497123","display_name":"Yaniv Azar","orcid":null},"institutions":[{"id":"https://openalex.org/I4210132147","display_name":"Penta-Ocean Construction (Japan)","ror":"https://ror.org/03zedkf25","country_code":"JP","type":"company","lineage":["https://openalex.org/I4210132147"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yaniv Azar","raw_affiliation_strings":["Penta-AI"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Penta-AI","institution_ids":["https://openalex.org/I4210132147"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006685812","display_name":"Or Avioz","orcid":null},"institutions":[{"id":"https://openalex.org/I4210132147","display_name":"Penta-Ocean Construction (Japan)","ror":"https://ror.org/03zedkf25","country_code":"JP","type":"company","lineage":["https://openalex.org/I4210132147"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Or Avioz","raw_affiliation_strings":["Penta-AI"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Penta-AI","institution_ids":["https://openalex.org/I4210132147"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058995786","display_name":"Niv Geron","orcid":null},"institutions":[{"id":"https://openalex.org/I4210132147","display_name":"Penta-Ocean Construction (Japan)","ror":"https://ror.org/03zedkf25","country_code":"JP","type":"company","lineage":["https://openalex.org/I4210132147"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Niv Geron","raw_affiliation_strings":["Penta-AI"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Penta-AI","institution_ids":["https://openalex.org/I4210132147"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065132836","display_name":"Tomer Ronen","orcid":null},"institutions":[{"id":"https://openalex.org/I4210132147","display_name":"Penta-Ocean Construction (Japan)","ror":"https://ror.org/03zedkf25","country_code":"JP","type":"company","lineage":["https://openalex.org/I4210132147"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tomer Ronen","raw_affiliation_strings":["Penta-AI"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Penta-AI","institution_ids":["https://openalex.org/I4210132147"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044027725","display_name":"Zach Avraham","orcid":null},"institutions":[{"id":"https://openalex.org/I4210132147","display_name":"Penta-Ocean Construction (Japan)","ror":"https://ror.org/03zedkf25","country_code":"JP","type":"company","lineage":["https://openalex.org/I4210132147"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Zach Avraham","raw_affiliation_strings":["Penta-AI"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Penta-AI","institution_ids":["https://openalex.org/I4210132147"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022357852","display_name":"Stav Shapiro","orcid":null},"institutions":[{"id":"https://openalex.org/I4210132147","display_name":"Penta-Ocean Construction (Japan)","ror":"https://ror.org/03zedkf25","country_code":"JP","type":"company","lineage":["https://openalex.org/I4210132147"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Stav Shapiro","raw_affiliation_strings":["Penta-AI"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Penta-AI","institution_ids":["https://openalex.org/I4210132147"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I4210132147"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.004501,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1833","last_page":"1842"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.7676888108253479},{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.7016288042068481},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.692284345626831},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.6572114825248718},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6505014896392822},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.6289128065109253},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.6054438948631287},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5902972221374512},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5821667313575745},{"id":"https://openalex.org/keywords/property","display_name":"Property (philosophy)","score":0.5148090720176697},{"id":"https://openalex.org/keywords/image-processing","display_name":"Image processing","score":0.510158121585846},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.47127243876457214},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.45613744854927063},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.40860143303871155},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3808916509151459},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.20707014203071594},{"id":"https://openalex.org/keywords/geometry","display_name":"Geometry","score":0.10947218537330627},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.07795947790145874}],"concepts":[{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.7676888108253479},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.7016288042068481},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.692284345626831},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.6572114825248718},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6505014896392822},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.6289128065109253},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.6054438948631287},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5902972221374512},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5821667313575745},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.5148090720176697},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.510158121585846},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.47127243876457214},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.45613744854927063},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.40860143303871155},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3808916509151459},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.20707014203071594},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.10947218537330627},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.07795947790145874},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/wacv45572.2020.9093534","is_oa":false,"landing_page_url":"https://doi.org/10.1109/wacv45572.2020.9093534","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE Winter Conference on Applications of Computer Vision (WACV)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1907.12122","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1907.12122","pdf_url":"https://arxiv.org/pdf/1907.12122","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:2964631447","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1907.12122","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1907.12122","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1907.12122","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1907.12122","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1907.12122","pdf_url":"https://arxiv.org/pdf/1907.12122","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2964631447.pdf","grobid_xml":"https://content.openalex.org/works/W2964631447.grobid-xml"},"referenced_works_count":55,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1903029394","https://openalex.org/W2074849287","https://openalex.org/W2102605133","https://openalex.org/W2144554289","https://openalex.org/W2194775991","https://openalex.org/W2333563142","https://openalex.org/W2339589954","https://openalex.org/W2343052201","https://openalex.org/W2464918637","https://openalex.org/W2565639579","https://openalex.org/W2593539516","https://openalex.org/W2605982830","https://openalex.org/W2614453579","https://openalex.org/W2784050770","https://openalex.org/W2785383245","https://openalex.org/W2800748770","https://openalex.org/W2810028092","https://openalex.org/W2811271212","https://openalex.org/W2875814315","https://openalex.org/W2899771611","https://openalex.org/W2899996070","https://openalex.org/W2901776468","https://openalex.org/W2903269730","https://openalex.org/W2919935710","https://openalex.org/W2922690896","https://openalex.org/W2953106684","https://openalex.org/W2962773189","https://openalex.org/W2962781062","https://openalex.org/W2962810613","https://openalex.org/W2963037989","https://openalex.org/W2963279502","https://openalex.org/W2963418739","https://openalex.org/W2963647456","https://openalex.org/W2963977642","https://openalex.org/W2964018263","https://openalex.org/W2964294787","https://openalex.org/W2967615747","https://openalex.org/W3106228955","https://openalex.org/W3106250896","https://openalex.org/W6620707391","https://openalex.org/W6631190155","https://openalex.org/W6702842988","https://openalex.org/W6719590338","https://openalex.org/W6729791593","https://openalex.org/W6751288959","https://openalex.org/W6752731419","https://openalex.org/W6752879036","https://openalex.org/W6755730432","https://openalex.org/W6756040250","https://openalex.org/W6756361325","https://openalex.org/W6756817110","https://openalex.org/W6760166208","https://openalex.org/W6760673939","https://openalex.org/W6785652829"],"related_works":["https://openalex.org/W2804654955","https://openalex.org/W3154664909","https://openalex.org/W2104384536","https://openalex.org/W119029272","https://openalex.org/W1556839878","https://openalex.org/W2332972075","https://openalex.org/W2744071505","https://openalex.org/W3203852229","https://openalex.org/W2990631821","https://openalex.org/W2083368499","https://openalex.org/W3198519842","https://openalex.org/W1955069752","https://openalex.org/W3090337410","https://openalex.org/W2095366733","https://openalex.org/W2242827783","https://openalex.org/W3045495919","https://openalex.org/W3196078144","https://openalex.org/W3005278309","https://openalex.org/W2738242232","https://openalex.org/W2781955767"],"abstract_inverted_index":{"\"Text":[0],"can":[1],"appear":[2],"anywhere\".":[3],"This":[4,51],"property":[5],"requires":[6],"us":[7,74],"to":[8,19,69,95,99,142,163,173,181,197,205,227],"carefully":[9],"process":[10,96],"all":[11,22,150],"the":[12,28,54,58,75,82,105,127,145,151,154,182,221],"pixels":[13,152],"in":[14,17,81],"an":[15,40,118,122,202],"image":[16,42,60,83,141,167],"order":[18],"accurately":[20],"localize":[21],"text":[23,35,79,131,170],"instances.":[24],"In":[25],"particular,":[26],"for":[27,185],"more":[29],"difficult":[30],"task":[31],"of":[32,57,78,129,153],"localizing":[33],"small":[34],"regions,":[36,171],"many":[37],"methods":[38],"use":[39],"enlarged":[41],"or":[43],"even":[44],"several":[45],"rescaled":[46],"ones":[47],"as":[48],"their":[49,85],"input.":[50],"significantly":[52,103],"increases":[53],"processing":[55,106,149,210],"time":[56],"entire":[59],"and":[61,84,97,215,223],"needlessly":[62],"enlarges":[63],"background":[64],"regions.":[65],"If":[66],"we":[67,88,112],"were":[68],"have":[70,90],"a":[71,114,138,165,174,194],"prior":[72,111,159],"telling":[73],"coarse":[76],"location":[77],"instances":[80],"approximate":[86,144],"scale,":[87,176],"could":[89],"adaptively":[91],"chosen":[92],"which":[93,177],"regions":[94],"how":[98],"rescale":[100],"them,":[101],"thus":[102],"reducing":[104],"time.":[107],"To":[108],"estimate":[109],"this":[110],"propose":[113],"segmentation-based":[115],"network":[116,134,184],"with":[117],"additional":[119],"\"scale":[120],"predictor\",":[121],"output":[123],"channel":[124],"that":[125,190],"predicts":[126],"scale":[128],"each":[130],"segment.":[132],"The":[133,157],"is":[135,160,178],"applied":[136],"on":[137,220],"scaled":[139],"down":[140],"efficiently":[143],"desired":[146],"prior,":[147],"without":[148],"original":[155],"image.":[156],"approximated":[158],"then":[161],"used":[162],"create":[164],"compact":[166],"containing":[168],"only":[169],"resized":[172],"canonical":[175],"fed":[179],"again":[180],"segmentation":[183],"fine-grained":[186],"detection.":[187],"We":[188],"show":[189],"our":[191,229],"approach":[192],"offers":[193],"powerful":[195],"alternative":[196],"fixed":[198],"scaling":[199],"schemes,":[200],"achieving":[201],"equivalent":[203],"accuracy":[204],"larger":[206],"input":[207],"scales":[208],"while":[209],"far":[211],"fewer":[212],"pixels.":[213],"Qualitative":[214],"quantitative":[216],"results":[217],"are":[218],"presented":[219],"ICDAR15":[222],"ICDAR17":[224],"MLT":[225],"benchmarks":[226],"validate":[228],"approach.":[230]},"counts_by_year":[],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2025-10-10T00:00:00"}
