{"id":"https://openalex.org/W2974212192","doi":"https://doi.org/10.1109/tmm.2019.2941820","title":"Multi-Level Policy and Reward-Based Deep Reinforcement Learning Framework for Image Captioning","display_name":"Multi-Level Policy and Reward-Based Deep Reinforcement Learning Framework for Image Captioning","publication_year":2019,"publication_date":"2019-09-18","ids":{"openalex":"https://openalex.org/W2974212192","doi":"https://doi.org/10.1109/tmm.2019.2941820","mag":"2974212192"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2019.2941820","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2019.2941820","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5054900679","display_name":"Ning Xu","orcid":"https://orcid.org/0000-0002-7526-4356"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ning Xu","raw_affiliation_strings":["School of Electrical and Information Engineering, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042324027","display_name":"Hanwang Zhang","orcid":"https://orcid.org/0000-0001-7374-8739"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Hanwang Zhang","raw_affiliation_strings":["School of Computer Science and Engineering, Nanyang Technological University, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081485810","display_name":"An-An Liu","orcid":"https://orcid.org/0000-0001-5755-9145"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"An-An Liu","raw_affiliation_strings":["School of Electrical and Information Engineering, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001185571","display_name":"Weizhi Nie","orcid":"https://orcid.org/0000-0002-0578-8138"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weizhi Nie","raw_affiliation_strings":["School of Electrical and Information Engineering, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033713097","display_name":"Yuting Su","orcid":"https://orcid.org/0000-0001-5165-204X"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuting Su","raw_affiliation_strings":["School of Electrical and Information Engineering, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Information Engineering, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058652390","display_name":"Jie Nie","orcid":"https://orcid.org/0000-0003-4952-7666"},"institutions":[{"id":"https://openalex.org/I59028903","display_name":"Ocean University of China","ror":"https://ror.org/04rdtx186","country_code":"CN","type":"education","lineage":["https://openalex.org/I59028903"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Nie","raw_affiliation_strings":["College of Information Science and Engineering, Ocean University of China, Qingdao, China"],"affiliations":[{"raw_affiliation_string":"College of Information Science and Engineering, Ocean University of China, Qingdao, China","institution_ids":["https://openalex.org/I59028903"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046305086","display_name":"Yongdong Zhang","orcid":"https://orcid.org/0000-0002-1151-1792"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongdong Zhang","raw_affiliation_strings":["University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5054900679"],"corresponding_institution_ids":["https://openalex.org/I162868743"],"apc_list":null,"apc_paid":null,"fwci":6.7441,"has_fulltext":false,"cited_by_count":111,"citation_normalized_percentile":{"value":0.97469455,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"22","issue":"5","first_page":"1372","last_page":"1383"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9861999750137329,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9699000120162964,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.989807665348053},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8858833909034729},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7788835763931274},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.615729570388794},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5842153429985046},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.5636652708053589},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.43631500005722046},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.42652708292007446},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.37238529324531555},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.32723376154899597}],"concepts":[{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.989807665348053},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8858833909034729},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7788835763931274},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.615729570388794},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5842153429985046},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.5636652708053589},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.43631500005722046},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.42652708292007446},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.37238529324531555},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32723376154899597},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2019.2941820","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2019.2941820","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1149763565","display_name":null,"funder_award_id":"61872267","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2050428177","display_name":null,"funder_award_id":"61772359","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2234015371","display_name":null,"funder_award_id":"A1907","funder_id":"https://openalex.org/F4320322927","funder_display_name":"Zhejiang University"},{"id":"https://openalex.org/G412208199","display_name":null,"funder_award_id":"2019XRX-0035","funder_id":"https://openalex.org/F4320322701","funder_display_name":"Tianjin University"},{"id":"https://openalex.org/G4204336864","display_name":null,"funder_award_id":"2017YFC0820600","funder_id":"https://openalex.org/F4320336026","funder_display_name":"National Key Research and Development Program of China Stem Cell and Translational Research"},{"id":"https://openalex.org/G8290336390","display_name":null,"funder_award_id":"61525206","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322701","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32"},{"id":"https://openalex.org/F4320322927","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884"},{"id":"https://openalex.org/F4320336026","display_name":"National Key Research and Development Program of China Stem Cell and Translational Research","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":84,"referenced_works":["https://openalex.org/W8316075","https://openalex.org/W1486649854","https://openalex.org/W1514535095","https://openalex.org/W1522301498","https://openalex.org/W1527575280","https://openalex.org/W1573040851","https://openalex.org/W1687846465","https://openalex.org/W1811254738","https://openalex.org/W1861492603","https://openalex.org/W1895577753","https://openalex.org/W1897761818","https://openalex.org/W1956340063","https://openalex.org/W1969616664","https://openalex.org/W2019370496","https://openalex.org/W2101105183","https://openalex.org/W2112912048","https://openalex.org/W2114841702","https://openalex.org/W2117539524","https://openalex.org/W2123301721","https://openalex.org/W2130942839","https://openalex.org/W2143449221","https://openalex.org/W2145339207","https://openalex.org/W2149172860","https://openalex.org/W2150824314","https://openalex.org/W2155027007","https://openalex.org/W2171858339","https://openalex.org/W2176263492","https://openalex.org/W2179488730","https://openalex.org/W2185175083","https://openalex.org/W2194775991","https://openalex.org/W2220981600","https://openalex.org/W2257979135","https://openalex.org/W2296385829","https://openalex.org/W2302086703","https://openalex.org/W2407414618","https://openalex.org/W2481240925","https://openalex.org/W2527238922","https://openalex.org/W2550553598","https://openalex.org/W2552161745","https://openalex.org/W2565591417","https://openalex.org/W2565729570","https://openalex.org/W2575842049","https://openalex.org/W2588822708","https://openalex.org/W2593804007","https://openalex.org/W2607151106","https://openalex.org/W2735673432","https://openalex.org/W2737892366","https://openalex.org/W2738318237","https://openalex.org/W2739107216","https://openalex.org/W2745461083","https://openalex.org/W2768661419","https://openalex.org/W2798959609","https://openalex.org/W2807718466","https://openalex.org/W2899771611","https://openalex.org/W2949376505","https://openalex.org/W2962706528","https://openalex.org/W2962887844","https://openalex.org/W2963084599","https://openalex.org/W2963248296","https://openalex.org/W2964018924","https://openalex.org/W2964121744","https://openalex.org/W2964168617","https://openalex.org/W2964253311","https://openalex.org/W3103022576","https://openalex.org/W4249013746","https://openalex.org/W6600334730","https://openalex.org/W6629028937","https://openalex.org/W6630875275","https://openalex.org/W6631190155","https://openalex.org/W6631516269","https://openalex.org/W6637306801","https://openalex.org/W6638742206","https://openalex.org/W6639102338","https://openalex.org/W6639694449","https://openalex.org/W6676647902","https://openalex.org/W6677231853","https://openalex.org/W6678262379","https://openalex.org/W6679436768","https://openalex.org/W6681184217","https://openalex.org/W6682086108","https://openalex.org/W6683204974","https://openalex.org/W6685322675","https://openalex.org/W6714077321","https://openalex.org/W6756040250"],"related_works":["https://openalex.org/W2890653670","https://openalex.org/W3217195652","https://openalex.org/W3119155061","https://openalex.org/W2125145484","https://openalex.org/W4287548803","https://openalex.org/W2945836425","https://openalex.org/W2903179935","https://openalex.org/W2973642807","https://openalex.org/W159132833","https://openalex.org/W4319083788"],"abstract_inverted_index":{"Image":[0],"captioning":[1,25,36,55,104,112,225],"is":[2,26,69],"one":[3],"of":[4,16,47,85,204,216,244],"the":[5,45,51,74,86,122,136,163,173,176,185,191,195,217,230,235,241,245],"most":[6],"challenging":[7],"tasks":[8],"in":[9,34],"AI":[10],"because":[11],"it":[12],"requires":[13],"an":[14],"understanding":[15],"both":[17,153],"complex":[18],"visuals":[19],"and":[20,64,77,79,82,98,138,144,157,175,187,190,220,227,234],"natural":[21],"language.":[22],"Because":[23],"image":[24,35,54,103,224],"essentially":[27],"a":[28,60,94,129,146,154,158,168,202],"sequential":[29],"prediction":[30],"task,":[31],"recent":[32],"advances":[33],"have":[37],"used":[38],"reinforcement":[39],"learning":[40],"(RL)":[41],"to":[42,73,161,171,239],"better":[43],"explore":[44,221],"dynamics":[46],"word-by-word":[48],"generation.":[49],"However,":[50],"existing":[52],"RL-based":[53],"methods":[56],"rely":[57],"primarily":[58],"on":[59,184,201,213],"single":[61],"policy":[62,97,131,174,232],"network":[63,132,233],"reward":[65,99,148,156,160,177,237],"function-an":[66],"approach":[67],"that":[68,105,133,150,194],"not":[70],"well":[71],"matched":[72],"multi-level":[75,96,130,147],"(word":[76],"sentence)":[78],"multi-modal":[80],"(vision":[81],"language)":[83],"nature":[84],"task.":[87],"To":[88],"solve":[89],"this":[90],"problem,":[91],"we":[92,166,209],"propose":[93,167],"novel":[95],"RL":[100,179],"framework":[101,124,197,219],"for":[102,119,141,178,229],"can":[106],"be":[107],"easily":[108],"integrated":[109],"with":[110],"RNN-based":[111],"models,":[113],"language":[114],"metrics,":[115],"or":[116],"visual-semantic":[117],"functions":[118],"optimization.":[120,180],"Specifically,":[121],"proposed":[123,196,218,246],"includes":[125],"two":[126],"modules:":[127],"1)":[128],"jointly":[134],"updates":[135],"word-":[137],"sentence-level":[139],"policies":[140],"word":[142],"generation;":[143],"2)":[145],"function":[149,238],"collaboratively":[151],"leverages":[152],"vision-language":[155],"language-language":[159,236],"guide":[162],"policy.":[164],"Furthermore,":[165],"guidance":[169],"term":[170],"bridge":[172],"The":[181],"extensive":[182],"experiments":[183],"MSCOCO":[186],"Flickr30k":[188],"datasets":[189],"analyses":[192],"show":[193],"achieves":[198],"competitive":[199],"performances":[200],"variety":[203],"evaluation":[205],"metrics.":[206],"In":[207],"addition,":[208],"conduct":[210],"ablation":[211],"studies":[212],"multiple":[214],"variants":[215],"several":[222],"representative":[223],"models":[226],"metrics":[228],"word-level":[231],"evaluate":[240],"generalization":[242],"ability":[243],"framework.":[247]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":10},{"year":2024,"cited_by_count":13},{"year":2023,"cited_by_count":20},{"year":2022,"cited_by_count":29},{"year":2021,"cited_by_count":19},{"year":2020,"cited_by_count":18}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
