{"id":"https://openalex.org/W7151226466","doi":"https://doi.org/10.48550/arxiv.2604.03836","title":"Cost-Efficient Multi-Scale Fovea for Semantic-Based Visual Search Attention","display_name":"Cost-Efficient Multi-Scale Fovea for Semantic-Based Visual Search Attention","publication_year":2026,"publication_date":"2026-04-04","ids":{"openalex":"https://openalex.org/W7151226466","doi":"https://doi.org/10.48550/arxiv.2604.03836"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.03836","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03836","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.03836","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133147177","display_name":"Jo\u00e3o Luzio","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luzio, Jo\u00e3o","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124111257","display_name":"Alexandre Bernardino","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bernardino, Alexandre","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5102952170","display_name":"Pl\u00ednio Moreno","orcid":"https://orcid.org/0000-0002-0496-2050"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Moreno, Plinio","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.6764000058174133,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.6764000058174133,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.16009999811649323,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.041200000792741776,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/foveal","display_name":"Foveal","score":0.7785999774932861},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.46790000796318054},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4634999930858612},{"id":"https://openalex.org/keywords/human-visual-system-model","display_name":"Human visual system model","score":0.43290001153945923},{"id":"https://openalex.org/keywords/visual-search","display_name":"Visual search","score":0.43149998784065247},{"id":"https://openalex.org/keywords/distortion","display_name":"Distortion (music)","score":0.424699991941452},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.4156999886035919},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.4153999984264374},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.38119998574256897},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.36399999260902405}],"concepts":[{"id":"https://openalex.org/C30181142","wikidata":"https://www.wikidata.org/wiki/Q865103","display_name":"Foveal","level":3,"score":0.7785999774932861},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7605999708175659},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6728000044822693},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.46790000796318054},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4634999930858612},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4602000117301941},{"id":"https://openalex.org/C160086991","wikidata":"https://www.wikidata.org/wiki/Q5939193","display_name":"Human visual system model","level":3,"score":0.43290001153945923},{"id":"https://openalex.org/C158495155","wikidata":"https://www.wikidata.org/wiki/Q2369151","display_name":"Visual search","level":2,"score":0.43149998784065247},{"id":"https://openalex.org/C126780896","wikidata":"https://www.wikidata.org/wiki/Q899871","display_name":"Distortion (music)","level":4,"score":0.424699991941452},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4156999886035919},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.4153999984264374},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.38119998574256897},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.36399999260902405},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.36090001463890076},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.35679998993873596},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.34950000047683716},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.3156999945640564},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.3116999864578247},{"id":"https://openalex.org/C2781427961","wikidata":"https://www.wikidata.org/wiki/Q430024","display_name":"Human eye","level":2,"score":0.310699999332428},{"id":"https://openalex.org/C178253425","wikidata":"https://www.wikidata.org/wiki/Q162668","display_name":"Visual perception","level":3,"score":0.29840001463890076},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.2953000068664551},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.29280000925064087},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.28349998593330383},{"id":"https://openalex.org/C2778751112","wikidata":"https://www.wikidata.org/wiki/Q835016","display_name":"Window (computing)","level":2,"score":0.2802000045776367},{"id":"https://openalex.org/C2779345533","wikidata":"https://www.wikidata.org/wiki/Q75785","display_name":"Visual cortex","level":2,"score":0.2773999869823456},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.27489998936653137},{"id":"https://openalex.org/C56461940","wikidata":"https://www.wikidata.org/wiki/Q970687","display_name":"Eye tracking","level":2,"score":0.27480000257492065},{"id":"https://openalex.org/C2778562939","wikidata":"https://www.wikidata.org/wiki/Q1298791","display_name":"Synchronization (alternating current)","level":3,"score":0.27070000767707825},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2696000039577484},{"id":"https://openalex.org/C53533937","wikidata":"https://www.wikidata.org/wiki/Q185020","display_name":"Histogram","level":3,"score":0.266400009393692}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.03836","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03836","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.03836","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03836","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Decent work and economic growth","score":0.4140844941139221,"id":"https://metadata.un.org/sdg/8"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Semantics":[0],"are":[1],"one":[2],"of":[3,7,29,46,139,174,180],"the":[4,27,30,79,137,172,175,188,215],"primary":[5],"sources":[6],"top-down":[8],"preattentive":[9],"information.":[10],"Modern":[11],"deep":[12,166],"object":[13,167],"detectors":[14,38],"excel":[15],"at":[16,87,111],"extracting":[17],"such":[18],"valuable":[19],"semantic":[20],"cues":[21],"from":[22],"complex":[23],"visual":[24,31,94,149],"scenes.":[25],"However,":[26],"size":[28],"input":[32],"to":[33,73,126,170],"be":[34],"processed":[35],"by":[36,60],"these":[37],"can":[39],"become":[40],"a":[41,68,116],"bottleneck,":[42],"particularly":[43],"in":[44,178],"terms":[45,179],"time":[47],"costs,":[48],"affecting":[49],"an":[50,112],"artificial":[51,70,157],"attention":[52,76],"system's":[53],"biological":[54],"plausibility":[55],"and":[56,160],"real-time":[57],"deployability.":[58],"Inspired":[59],"classical":[61],"exponential":[62],"density":[63],"roll-off":[64],"topologies,":[65],"we":[66,135,205],"apply":[67],"new":[69,176,189],"foveation":[71],"module":[72,192],"our":[74,140],"novel":[75,141],"prediction":[77,202],"pipeline:":[78],"Semantic-based":[80],"Bayesian":[81],"Attention":[82],"(SemBA)":[83],"framework.":[84],"We":[85,151,183],"aim":[86],"reducing":[88],"detection-related":[89],"computational":[90,181],"costs":[91,197],"without":[92],"compromising":[93],"task":[95],"accuracy,":[96],"thereby":[97],"making":[98],"SemBA":[99,208],"more":[100],"biologically":[101],"plausible.":[102],"The":[103],"proposed":[104],"multi-scale":[105],"pyramidal":[106],"field-of-view":[107],"retains":[108],"maximum":[109],"acuity":[110],"innermost":[113],"level,":[114],"around":[115],"focal":[117],"point,":[118],"while":[119,198,213],"gradually":[120],"increasing":[121],"distortion":[122],"for":[123],"outer":[124],"levels":[125],"mimic":[127],"peripheral":[128],"uncertainty":[129],"via":[130],"downsampling.":[131],"In":[132],"this":[133],"work":[134],"evaluate":[136],"performance":[138],"Multi-Scale":[142,190],"Fovea,":[143],"incorporated":[144],"into":[145],"SemBA,":[146],"on":[147],"target-present":[148],"search.":[150],"also":[152],"compare":[153],"it":[154],"against":[155],"other":[156],"foveal":[158],"systems,":[159],"conduct":[161],"ablation":[162],"studies":[163],"with":[164],"different":[165],"detection":[168],"models":[169],"assess":[171],"impact":[173],"topology":[177],"costs.":[182],"experimentally":[184],"demonstrate":[185],"that":[186,207],"including":[187],"Fovea":[191],"effectively":[193],"reduces":[194],"inherent":[195],"processing":[196],"improving":[199],"SemBA's":[200],"scanpath":[201],"accuracy.":[203],"Remarkably,":[204],"show":[206],"closely":[209],"approximates":[210],"human":[211,217],"consistency":[212],"retaining":[214],"actual":[216],"fovea's":[218],"proportions.":[219]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-08T00:00:00"}
