{"id":"https://openalex.org/W2612400242","doi":"https://doi.org/10.29007/lcmk","title":"Capacity Visual Attention Networks","display_name":"Capacity Visual Attention Networks","publication_year":2018,"publication_date":"2018-01-23","ids":{"openalex":"https://openalex.org/W2612400242","doi":"https://doi.org/10.29007/lcmk","mag":"2612400242"},"language":"en","primary_location":{"id":"doi:10.29007/lcmk","is_oa":true,"landing_page_url":"https://doi.org/10.29007/lcmk","pdf_url":"https://easychair.org/publications/open/RlH","source":{"id":"https://openalex.org/S4220651395","display_name":"EPiC series in computing","issn_l":"2398-7340","issn":["2398-7340"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EPiC Series in Computing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://easychair.org/publications/open/RlH","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5050963242","display_name":"Marcus Edel","orcid":"https://orcid.org/0000-0001-5445-7303"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Marcus Edel","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5039975689","display_name":"Joscha Lausch","orcid":null},"institutions":[{"id":"https://openalex.org/I75951250","display_name":"Freie Universit\u00e4t Berlin","ror":"https://ror.org/046ak2485","country_code":"DE","type":"education","lineage":["https://openalex.org/I75951250"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Joscha Lausch","raw_affiliation_strings":["Freie Universitt Berlin, Berlin, Germany","Freie Universit\u00e4t Berlin, Berlin, Germany"],"affiliations":[{"raw_affiliation_string":"Freie Universitt Berlin, Berlin, Germany","institution_ids":["https://openalex.org/I75951250"]},{"raw_affiliation_string":"Freie Universit\u00e4t Berlin, Berlin, Germany","institution_ids":["https://openalex.org/I75951250"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5039975689"],"corresponding_institution_ids":["https://openalex.org/I75951250"],"apc_list":null,"apc_paid":null,"fwci":0.1185,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.4084088,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"41","issue":null,"first_page":"72","last_page":"62"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mnist-database","display_name":"MNIST database","score":0.9210058450698853},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8763935565948486},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.7030994892120361},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6402561664581299},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6368468403816223},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.6175608038902283},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5360062122344971},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5285692811012268},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5193873047828674},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4814107418060303},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.47396156191825867},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.43318960070610046},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4156051278114319},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.38968396186828613},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.11541971564292908}],"concepts":[{"id":"https://openalex.org/C190502265","wikidata":"https://www.wikidata.org/wiki/Q17069496","display_name":"MNIST database","level":3,"score":0.9210058450698853},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8763935565948486},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.7030994892120361},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6402561664581299},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6368468403816223},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.6175608038902283},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5360062122344971},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5285692811012268},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5193873047828674},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4814107418060303},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.47396156191825867},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.43318960070610046},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4156051278114319},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.38968396186828613},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.11541971564292908},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.29007/lcmk","is_oa":true,"landing_page_url":"https://doi.org/10.29007/lcmk","pdf_url":"https://easychair.org/publications/open/RlH","source":{"id":"https://openalex.org/S4220651395","display_name":"EPiC series in computing","issn_l":"2398-7340","issn":["2398-7340"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EPiC Series in Computing","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.29007/lcmk","is_oa":true,"landing_page_url":"https://doi.org/10.29007/lcmk","pdf_url":"https://easychair.org/publications/open/RlH","source":{"id":"https://openalex.org/S4220651395","display_name":"EPiC series in computing","issn_l":"2398-7340","issn":["2398-7340"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EPiC Series in Computing","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2612400242.pdf","grobid_xml":"https://content.openalex.org/works/W2612400242.grobid-xml"},"referenced_works_count":37,"referenced_works":["https://openalex.org/W330298975","https://openalex.org/W587794757","https://openalex.org/W1484210532","https://openalex.org/W1516887802","https://openalex.org/W1665214252","https://openalex.org/W1757796397","https://openalex.org/W1850742715","https://openalex.org/W1982522767","https://openalex.org/W1985912834","https://openalex.org/W2020683423","https://openalex.org/W2025823130","https://openalex.org/W2064675550","https://openalex.org/W2079735306","https://openalex.org/W2095705004","https://openalex.org/W2097117768","https://openalex.org/W2106874006","https://openalex.org/W2116261113","https://openalex.org/W2117876524","https://openalex.org/W2119717200","https://openalex.org/W2125085157","https://openalex.org/W2136848157","https://openalex.org/W2142037471","https://openalex.org/W2151103935","https://openalex.org/W2162390675","https://openalex.org/W2163605009","https://openalex.org/W2257979135","https://openalex.org/W2335728318","https://openalex.org/W2618530766","https://openalex.org/W2937970997","https://openalex.org/W2951527505","https://openalex.org/W2962719052","https://openalex.org/W2962741254","https://openalex.org/W3099037876","https://openalex.org/W4230563027","https://openalex.org/W4298857966","https://openalex.org/W4303633609","https://openalex.org/W6677408996"],"related_works":["https://openalex.org/W4386603768","https://openalex.org/W2950475743","https://openalex.org/W2886711096","https://openalex.org/W2750384547","https://openalex.org/W4380078352","https://openalex.org/W3036048022","https://openalex.org/W4309224979","https://openalex.org/W3026879719","https://openalex.org/W2969228573","https://openalex.org/W2963690996"],"abstract_inverted_index":{"Inspired":[0],"by":[1,24,51],"recent":[2],"work":[3],"in":[4],"machine":[5],"translation":[6],"and":[7,36,68,87,95,112],"object":[8],"detection,":[9],"we":[10,90],"introduce":[11],"an":[12,22,55],"attention-based":[13],"model":[14,63,82,123],"that":[15,120],"automatically":[16],"learns":[17],"to":[18,62,88,126],"extract":[19],"information":[20],"from":[21],"image":[23,115],"adaptively":[25],"assigning":[26],"its":[27],"capacity":[28,70,94],"across":[29],"different":[30,43],"portions":[31],"of":[32,42,100,131],"the":[33,39,80,98,101,108,121,129],"input":[34,76],"data":[35],"only":[37],"processing":[38],"selected":[40],"regions":[41,77],"sizes":[44],"at":[45],"high":[46],"resolution.":[47],"This":[48,72],"is":[49,84,124],"achieved":[50],"combining":[52],"two":[53],"modules:":[54],"attention":[56,81],"sub-network":[57,73],"which":[58,79,89],"uses":[59],"a":[60,64,69],"mechanism":[61],"human-like":[65],"counting":[66],"process":[67],"sub-network.":[71],"efficiently":[74],"identifies":[75],"for":[78],"output":[83],"most":[85],"sensitive":[86],"should":[91],"devote":[92],"more":[93],"dynamically":[96],"adapt":[97],"size":[99],"region.":[102],"We":[103],"focus":[104],"our":[105],"evaluation":[106],"on":[107],"Cluttered":[109,113],"MNIST,":[110],"SVHN,":[111],"GTSRB":[114],"datasets.":[116],"Our":[117],"findings":[118],"indicate":[119],"proposed":[122],"able":[125],"drastically":[127],"reduce":[128],"number":[130],"computations,":[132],"compared":[133],"with":[134],"traditional":[135],"convolutional":[136],"neural":[137],"networks,":[138],"while":[139],"maintaining":[140],"similar":[141],"or":[142],"better":[143],"performance.":[144]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
