{"id":"https://openalex.org/W2947452845","doi":"https://doi.org/10.1109/spcom.2018.8724400","title":"Recursive Network with Explicit Neighbor Connection for Image Captioning","display_name":"Recursive Network with Explicit Neighbor Connection for Image Captioning","publication_year":2018,"publication_date":"2018-07-01","ids":{"openalex":"https://openalex.org/W2947452845","doi":"https://doi.org/10.1109/spcom.2018.8724400","mag":"2947452845"},"language":"en","primary_location":{"id":"doi:10.1109/spcom.2018.8724400","is_oa":false,"landing_page_url":"https://doi.org/10.1109/spcom.2018.8724400","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 International Conference on Signal Processing and Communications (SPCOM)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002681900","display_name":"Mohammedsayeemuddin K Shaikh","orcid":null},"institutions":[{"id":"https://openalex.org/I98389781","display_name":"Dhirubhai Ambani Institute of Information and Communication Technology","ror":"https://ror.org/02d5b7g69","country_code":"IN","type":"education","lineage":["https://openalex.org/I98389781"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Mohammedsayeemuddin K Shaikh","raw_affiliation_strings":["Dhirubhai Ambani Institute of Information and Communication Technology, Gandhinagar, Gujarat, India"],"affiliations":[{"raw_affiliation_string":"Dhirubhai Ambani Institute of Information and Communication Technology, Gandhinagar, Gujarat, India","institution_ids":["https://openalex.org/I98389781"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101917213","display_name":"Manjunath V. Joshi","orcid":"https://orcid.org/0000-0002-1842-9118"},"institutions":[{"id":"https://openalex.org/I98389781","display_name":"Dhirubhai Ambani Institute of Information and Communication Technology","ror":"https://ror.org/02d5b7g69","country_code":"IN","type":"education","lineage":["https://openalex.org/I98389781"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Manjunath V. Joshi","raw_affiliation_strings":["Dhirubhai Ambani Institute of Information and Communication Technology, Gandhinagar, Gujarat, India"],"affiliations":[{"raw_affiliation_string":"Dhirubhai Ambani Institute of Information and Communication Technology, Gandhinagar, Gujarat, India","institution_ids":["https://openalex.org/I98389781"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5002681900"],"corresponding_institution_ids":["https://openalex.org/I98389781"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.22212076,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"3361","issue":null,"first_page":"392","last_page":"396"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8362946510314941},{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.7891526222229004},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.7448120713233948},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.7317487597465515},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5802301168441772},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5406612157821655},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5276583433151245},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.47154998779296875},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4619249701499939},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.4458678662776947},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.43158721923828125},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.42663463950157166},{"id":"https://openalex.org/keywords/connection","display_name":"Connection (principal bundle)","score":0.4219311475753784},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.40329626202583313},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.32911521196365356},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2496722936630249},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.06447997689247131}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8362946510314941},{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.7891526222229004},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.7448120713233948},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.7317487597465515},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5802301168441772},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5406612157821655},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5276583433151245},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.47154998779296875},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4619249701499939},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.4458678662776947},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.43158721923828125},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.42663463950157166},{"id":"https://openalex.org/C13355873","wikidata":"https://www.wikidata.org/wiki/Q2920850","display_name":"Connection (principal bundle)","level":2,"score":0.4219311475753784},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.40329626202583313},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.32911521196365356},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2496722936630249},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.06447997689247131},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/spcom.2018.8724400","is_oa":false,"landing_page_url":"https://doi.org/10.1109/spcom.2018.8724400","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 International Conference on Signal Processing and Communications (SPCOM)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W68733909","https://openalex.org/W1514535095","https://openalex.org/W1538131130","https://openalex.org/W1686810756","https://openalex.org/W1706899115","https://openalex.org/W1811254738","https://openalex.org/W1895577753","https://openalex.org/W1897761818","https://openalex.org/W1905882502","https://openalex.org/W1931639407","https://openalex.org/W1947481528","https://openalex.org/W2064675550","https://openalex.org/W2091812280","https://openalex.org/W2109586012","https://openalex.org/W2157331557","https://openalex.org/W2171361956","https://openalex.org/W2185175083","https://openalex.org/W2302086703","https://openalex.org/W2962935746","https://openalex.org/W2964018924","https://openalex.org/W6630875275","https://openalex.org/W6632100814","https://openalex.org/W6639694449","https://openalex.org/W6676497082","https://openalex.org/W6685230081","https://openalex.org/W6730707965","https://openalex.org/W6898505805"],"related_works":["https://openalex.org/W4210416330","https://openalex.org/W2775506363","https://openalex.org/W3088136942","https://openalex.org/W4290852288","https://openalex.org/W2949362007","https://openalex.org/W4283207562","https://openalex.org/W2963177403","https://openalex.org/W2330246314","https://openalex.org/W2949522393","https://openalex.org/W4289422896"],"abstract_inverted_index":{"Generating":[0],"natural":[1],"image":[2,31,50],"descriptions":[3],"by":[4,37,43,123,159],"machine":[5],"is":[6,22,32],"a":[7],"non-trivial":[8],"task.":[9],"Many":[10],"researchers":[11],"have":[12,79],"worked":[13],"in":[14,87,117,156],"this":[15,72],"area":[16],"and":[17,40,57,67,99,104],"the":[18,38,44,49,65,68,76,84,88,120,133,141,147,151],"most":[19],"common":[20],"approach":[21],"to":[23,46,78,83,130],"use":[24,91],"encoder-decoder":[25],"framework":[26],"based":[27],"models.":[28],"Here":[29],"an":[30,154],"encoded":[33],"into":[34],"feature":[35],"vector":[36],"encoder":[39,66],"then":[41],"decoded":[42],"decoder":[45,77,98,152],"arrive":[47],"at":[48],"caption.":[51],"Generally":[52],"convolutional":[53],"neural":[54,59],"network":[55,60],"(CNN)":[56],"recurrent":[58,93],"(RNN)":[61],"are":[62],"used":[63],"as":[64,150],"decoder,":[69],"respectively.":[70],"In":[71],"paper,":[73],"we":[74],"modify":[75],"explicit":[80,114,134,148],"memory":[81,115,135],"connection":[82],"previous":[85],"sample":[86],"sequence.":[89],"We":[90],"gated":[92],"unit":[94],"(GRU)":[95],"architecture":[96],"for":[97],"train":[100],"it":[101,139],"on":[102],"Flickr8K":[103,108],"Flickr30K":[105],"datasets.":[106],"For":[107],"dataset,":[109],"results":[110],"show":[111],"that":[112,131],"having":[113],"link":[116,149],"GRU":[118],"improves":[119],"BLEU-4":[121,157],"score":[122,158],"more":[124],"than":[125],"10":[126],"percent":[127],"when":[128],"compared":[129],"without":[132,146],"link.":[136],"Also,":[137],"comparing":[138],"with":[140],"model":[142],"which":[143],"uses":[144],"RNN":[145],"gives":[153],"improvement":[155],"20":[160],"percent.":[161]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
