{"id":"https://openalex.org/W2985867184","doi":"https://doi.org/10.1109/access.2020.2982571","title":"Conditionally Learn to Pay Attention for Sequential Visual Task","display_name":"Conditionally Learn to Pay Attention for Sequential Visual Task","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W2985867184","doi":"https://doi.org/10.1109/access.2020.2982571","mag":"2985867184"},"language":"en","primary_location":{"id":"doi:10.1109/access.2020.2982571","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.2982571","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09044202.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09044202.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049302472","display_name":"Jun He","orcid":"https://orcid.org/0000-0003-1671-2283"},"institutions":[{"id":"https://openalex.org/I200845125","display_name":"Nanjing University of Information Science and Technology","ror":"https://ror.org/02y0rxk19","country_code":"CN","type":"education","lineage":["https://openalex.org/I200845125"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun He","raw_affiliation_strings":["School of Artificial Intelligence, Nanjing University of Information Science and Technology, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0003-1671-2283","affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Nanjing University of Information Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I200845125"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070277602","display_name":"Quan-Jie Cao","orcid":null},"institutions":[{"id":"https://openalex.org/I200845125","display_name":"Nanjing University of Information Science and Technology","ror":"https://ror.org/02y0rxk19","country_code":"CN","type":"education","lineage":["https://openalex.org/I200845125"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Quan-Jie Cao","raw_affiliation_strings":["School of Artificial Intelligence, Nanjing University of Information Science and Technology, Nanjing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Nanjing University of Information Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I200845125"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076127071","display_name":"Lei Zhang","orcid":"https://orcid.org/0000-0001-8749-7459"},"institutions":[{"id":"https://openalex.org/I152031979","display_name":"Nanjing Normal University","ror":"https://ror.org/036trcv74","country_code":"CN","type":"education","lineage":["https://openalex.org/I152031979"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lei Zhang","raw_affiliation_strings":["School of Electrical and Automation Engineering, Nanjing Normal University, Nanjing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electrical and Automation Engineering, Nanjing Normal University, Nanjing, China","institution_ids":["https://openalex.org/I152031979"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103041902","display_name":"Hui Tao","orcid":"https://orcid.org/0000-0002-1122-8962"},"institutions":[{"id":"https://openalex.org/I200845125","display_name":"Nanjing University of Information Science and Technology","ror":"https://ror.org/02y0rxk19","country_code":"CN","type":"education","lineage":["https://openalex.org/I200845125"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hui Tao","raw_affiliation_strings":["School of Artificial Intelligence, Nanjing University of Information Science and Technology, Nanjing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Nanjing University of Information Science and Technology, Nanjing, China","institution_ids":["https://openalex.org/I200845125"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.00471432,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"8","issue":null,"first_page":"56695","last_page":"56710"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8044102787971497},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6854131817817688},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6789400577545166},{"id":"https://openalex.org/keywords/conditional-random-field","display_name":"Conditional random field","score":0.6615018844604492},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6580649614334106},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5623325705528259},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.4947144687175751},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.47427472472190857},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.431167334318161},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.42447513341903687},{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.41814807057380676},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.31637609004974365}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8044102787971497},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6854131817817688},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6789400577545166},{"id":"https://openalex.org/C152565575","wikidata":"https://www.wikidata.org/wiki/Q1124538","display_name":"Conditional random field","level":2,"score":0.6615018844604492},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6580649614334106},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5623325705528259},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.4947144687175751},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.47427472472190857},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.431167334318161},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.42447513341903687},{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.41814807057380676},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.31637609004974365},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/access.2020.2982571","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.2982571","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09044202.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:1911.04365","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1911.04365","pdf_url":"https://arxiv.org/pdf/1911.04365","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:doaj.org/article:5c134e3a08354a408693f8e80d474ae6","is_oa":true,"landing_page_url":"https://doaj.org/article/5c134e3a08354a408693f8e80d474ae6","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 8, Pp 56695-56710 (2020)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2020.2982571","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2020.2982571","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/8948470/09044202.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3617193139","display_name":null,"funder_award_id":"61601230","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2985867184.pdf","grobid_xml":"https://content.openalex.org/works/W2985867184.grobid-xml"},"referenced_works_count":62,"referenced_works":["https://openalex.org/W603908379","https://openalex.org/W639708223","https://openalex.org/W1484210532","https://openalex.org/W1514535095","https://openalex.org/W1522301498","https://openalex.org/W1686810756","https://openalex.org/W1811254738","https://openalex.org/W1827297289","https://openalex.org/W1861492603","https://openalex.org/W1895577753","https://openalex.org/W1905882502","https://openalex.org/W1956340063","https://openalex.org/W2064675550","https://openalex.org/W2101105183","https://openalex.org/W2127791185","https://openalex.org/W2133459682","https://openalex.org/W2133564696","https://openalex.org/W2143612262","https://openalex.org/W2147527908","https://openalex.org/W2155027007","https://openalex.org/W2221625691","https://openalex.org/W2302086703","https://openalex.org/W2335728318","https://openalex.org/W2463565445","https://openalex.org/W2550553598","https://openalex.org/W2559918205","https://openalex.org/W2611254175","https://openalex.org/W2613718673","https://openalex.org/W2745461083","https://openalex.org/W2753613501","https://openalex.org/W2795151422","https://openalex.org/W2901988662","https://openalex.org/W2951527505","https://openalex.org/W2953301748","https://openalex.org/W2962851944","https://openalex.org/W2962961439","https://openalex.org/W2963443217","https://openalex.org/W2963656855","https://openalex.org/W2964036520","https://openalex.org/W2964121744","https://openalex.org/W2964308564","https://openalex.org/W2965697393","https://openalex.org/W6618372016","https://openalex.org/W6620707391","https://openalex.org/W6628927728","https://openalex.org/W6630875275","https://openalex.org/W6631190155","https://openalex.org/W6637373629","https://openalex.org/W6638685980","https://openalex.org/W6638742206","https://openalex.org/W6639102338","https://openalex.org/W6679149884","https://openalex.org/W6679434410","https://openalex.org/W6682137061","https://openalex.org/W6683204974","https://openalex.org/W6685133223","https://openalex.org/W6692004142","https://openalex.org/W6703116779","https://openalex.org/W6719057275","https://openalex.org/W6743492414","https://openalex.org/W6748666111","https://openalex.org/W6898505805"],"related_works":["https://openalex.org/W4210416330","https://openalex.org/W2775506363","https://openalex.org/W3088136942","https://openalex.org/W2963177403","https://openalex.org/W4290852288","https://openalex.org/W2949362007","https://openalex.org/W4283207562","https://openalex.org/W2330246314","https://openalex.org/W2949522393","https://openalex.org/W4301042974"],"abstract_inverted_index":{"Sequential":[0],"visual":[1,97],"task":[2],"usually":[3],"requires":[4],"to":[5,8,66,78,95,190],"pay":[6],"attention":[7,22,28,69,131,155,164,182],"its":[9,15],"current":[10,45],"interested":[11],"object":[12],"conditional":[13,34,80,84,130],"on":[14,137],"previous":[16],"observations.":[17],"Different":[18],"from":[19],"popular":[20,162],"soft":[21,163],"mechanism,":[23],"we":[24],"propose":[25],"a":[26,32,50,101,111,176],"new":[27],"framework":[29],"by":[30,71,90,173],"introducing":[31],"novel":[33],"global":[35,81,85],"feature":[36,41,86],"which":[37],"represents":[38],"the":[39,44,57,68,74,79,134,138,161,186,191],"weak":[40],"descriptor":[42],"of":[43],"focused":[46],"object.":[47],"Specifically,":[48],"for":[49,106,116,151,167,178],"standard":[51],"CNN":[52],"(Convolutional":[53],"Neural":[54],"Network)":[55],"pipeline,":[56],"convolutional":[58,75],"layers":[59],"with":[60,145],"different":[61,91,96],"receptive":[62],"fields":[63],"are":[64],"used":[65],"produce":[67],"maps":[70],"measuring":[72],"how":[73],"features":[76],"align":[77],"feature.":[82],"The":[83],"can":[87,184],"be":[88],"generated":[89],"recurrent":[92,103],"structure":[93],"according":[94],"tasks,":[98],"such":[99],"as":[100],"simple":[102],"neural":[104],"network":[105],"multiple":[107,122,170],"objects":[108,123,171],"recognition,":[109],"or":[110],"moderate":[112],"complex":[113],"language":[114],"model":[115,132,156,183],"image":[117,152],"captioning":[118],"and":[119,166],"weakly":[120,168],"supervised":[121,169],"segmentation.":[124],"Experiments":[125],"show":[126],"that":[127],"our":[128,154,181],"proposed":[129],"achieves":[133],"best":[135],"performance":[136],"SVHN":[139],"(Street":[140],"View":[141],"House":[142],"Numbers)":[143],"dataset":[144],"/":[146],"without":[147],"extra":[148],"bounding":[149],"box;":[150],"caption,":[153],"generates":[157],"better":[158],"scores":[159],"than":[160],"model;":[165],"segmentation,":[172],"simply":[174],"describing":[175],"sentence":[177],"each":[179],"image,":[180],"segment":[185],"salient":[187],"regions":[188],"corresponding":[189],"meaningful":[192],"noun":[193],"words.":[194]},"counts_by_year":[],"updated_date":"2026-07-03T08:13:44.112507","created_date":"2025-10-10T00:00:00"}
