{"id":"https://openalex.org/W4309072407","doi":"https://doi.org/10.1186/s40537-022-00664-6","title":"A novel Multi-Layer Attention Framework for visual description prediction using bidirectional LSTM","display_name":"A novel Multi-Layer Attention Framework for visual description prediction using bidirectional LSTM","publication_year":2022,"publication_date":"2022-11-12","ids":{"openalex":"https://openalex.org/W4309072407","doi":"https://doi.org/10.1186/s40537-022-00664-6"},"language":"en","primary_location":{"id":"doi:10.1186/s40537-022-00664-6","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-022-00664-6","pdf_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-022-00664-6","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-022-00664-6","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037889655","display_name":"Dinesh Naik","orcid":"https://orcid.org/0000-0002-8989-6282"},"institutions":[{"id":"https://openalex.org/I11880225","display_name":"National Institute of Technology Karnataka","ror":"https://ror.org/01hz4v948","country_code":"IN","type":"education","lineage":["https://openalex.org/I11880225"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Dinesh Naik","raw_affiliation_strings":["Department of Information Technology, National Institute of Technology Karnataka, Surathkal, Mangalore, 575025, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Information Technology, National Institute of Technology Karnataka, Surathkal, Mangalore, 575025, India","institution_ids":["https://openalex.org/I11880225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5054016512","display_name":"C. D. Jaidhar","orcid":null},"institutions":[{"id":"https://openalex.org/I11880225","display_name":"National Institute of Technology Karnataka","ror":"https://ror.org/01hz4v948","country_code":"IN","type":"education","lineage":["https://openalex.org/I11880225"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"C. D. Jaidhar","raw_affiliation_strings":["Department of Information Technology, National Institute of Technology Karnataka, Surathkal, Mangalore, 575025, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Information Technology, National Institute of Technology Karnataka, Surathkal, Mangalore, 575025, India","institution_ids":["https://openalex.org/I11880225"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5037889655"],"corresponding_institution_ids":["https://openalex.org/I11880225"],"apc_list":{"value":1060,"currency":"GBP","value_usd":1300},"apc_paid":{"value":1060,"currency":"GBP","value_usd":1300},"fwci":1.9292,"has_fulltext":true,"cited_by_count":19,"citation_normalized_percentile":{"value":0.87532117,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"9","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.9779846668243408},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9208593964576721},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5599011182785034},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5527490973472595},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5107874870300293},{"id":"https://openalex.org/keywords/layer","display_name":"Layer (electronics)","score":0.4916253685951233},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.4865364134311676},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.4402525722980499},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.36304354667663574},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3251996636390686},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.2586921453475952}],"concepts":[{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.9779846668243408},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9208593964576721},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5599011182785034},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5527490973472595},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5107874870300293},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.4916253685951233},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.4865364134311676},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.4402525722980499},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.36304354667663574},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3251996636390686},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2586921453475952},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1186/s40537-022-00664-6","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-022-00664-6","pdf_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-022-00664-6","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:4421f4de177f4f07bad56de390ffb22b","is_oa":true,"landing_page_url":"https://doaj.org/article/4421f4de177f4f07bad56de390ffb22b","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Journal of Big Data, Vol 9, Iss 1, Pp 1-23 (2022)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1186/s40537-022-00664-6","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-022-00664-6","pdf_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-022-00664-6","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.49000000953674316,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4309072407.pdf","grobid_xml":"https://content.openalex.org/works/W4309072407.grobid-xml"},"referenced_works_count":38,"referenced_works":["https://openalex.org/W877909479","https://openalex.org/W1573040851","https://openalex.org/W1586939924","https://openalex.org/W1607035479","https://openalex.org/W1905882502","https://openalex.org/W2064675550","https://openalex.org/W2101105183","https://openalex.org/W2131774270","https://openalex.org/W2139501017","https://openalex.org/W2152984213","https://openalex.org/W2425121537","https://openalex.org/W2523993696","https://openalex.org/W2598789561","https://openalex.org/W2600463316","https://openalex.org/W2739107216","https://openalex.org/W2766375149","https://openalex.org/W2769581371","https://openalex.org/W2803620531","https://openalex.org/W2887712318","https://openalex.org/W2914306086","https://openalex.org/W2945223572","https://openalex.org/W2953461088","https://openalex.org/W2962861647","https://openalex.org/W2963843052","https://openalex.org/W2963916161","https://openalex.org/W2964081807","https://openalex.org/W2964137974","https://openalex.org/W2964241990","https://openalex.org/W2998637494","https://openalex.org/W3112404983","https://openalex.org/W3134875898","https://openalex.org/W3140854437","https://openalex.org/W3163971663","https://openalex.org/W3176923149","https://openalex.org/W3196957659","https://openalex.org/W4211103897","https://openalex.org/W6600234944","https://openalex.org/W6679436768"],"related_works":["https://openalex.org/W4210416330","https://openalex.org/W2775506363","https://openalex.org/W3088136942","https://openalex.org/W4290852288","https://openalex.org/W2949362007","https://openalex.org/W4388893791","https://openalex.org/W4283207562","https://openalex.org/W2963177403","https://openalex.org/W2330246314","https://openalex.org/W2949522393"],"abstract_inverted_index":{"Abstract":[0],"The":[1,63,78,175],"massive":[2],"influx":[3],"of":[4,17,54,96,103,164,197],"text,":[5],"images,":[6],"and":[7,75,108,132,147,151,187],"videos":[8],"to":[9,30,93,137,182,191],"the":[10,15,52,69,94,99,162,165,192,200],"internet":[11],"has":[12,34],"recently":[13],"increased":[14],"challenge":[16,37],"computer":[18],"vision-based":[19],"tasks":[20],"in":[21,60,185],"big":[22],"data.":[23],"Integrating":[24],"visual":[25,123,148],"data":[26],"with":[27,125,154],"natural":[28],"language":[29],"generate":[31,152],"video":[32,61,65,89,105,173],"explanations":[33],"been":[35],"a":[36,104,117,133,169],"for":[38,111,121,172],"decades.":[39],"However,":[40],"recent":[41],"experiments":[42],"on":[43],"image/video":[44],"captioning":[45,66,112],"that":[46],"employ":[47],"Long-Short-Term-Memory":[48],"(LSTM)":[49],"have":[50],"piqued":[51],"interest":[53],"researchers":[55],"studying":[56],"its":[57],"possible":[58],"application":[59],"captioning.":[62,174],"proposed":[64,201],"architecture":[67,80],"combines":[68],"bidirectional":[70],"multilayer":[71,134],"LSTM":[72],"(BiLSTM)":[73],"encoder":[74],"unidirectional":[76],"decoder.":[77],"innovative":[79],"also":[81],"considers":[82],"temporal":[83],"relations":[84],"when":[85],"creating":[86],"superior":[87,179],"global":[88],"representations.":[90],"In":[91,158,195],"contrast":[92],"majority":[95],"prior":[97],"work,":[98],"most":[100,204],"relevant":[101],"features":[102],"are":[106],"selected":[107],"utilized":[109],"specifically":[110],"purposes.":[113],"Existing":[114],"methods":[115],"utilize":[116],"single-layer":[118],"attention":[119,135],"mechanism":[120,136],"linking":[122],"input":[124],"phrase":[126],"meaning.":[127],"This":[128],"approach":[129,202],"employs":[130],"LSTMs":[131],"extract":[138],"characteristics":[139],"from":[140],"movies,":[141],"construct":[142],"links":[143],"between":[144],"multi-modal":[145],"(words":[146],"material)":[149],"representations,":[150],"sentences":[153],"rich":[155],"semantic":[156],"coherence.":[157],"addition,":[159],"we":[160],"evaluated":[161],"performance":[163,180,189],"suggested":[166],"system":[167],"using":[168],"benchmark":[170],"dataset":[171],"obtained":[176],"results":[177],"reveal":[178],"relative":[181,190],"state-of-the-art":[183],"works":[184],"METEOR":[186],"promising":[188],"BLEU":[193],"score.":[194],"terms":[196],"quantitative":[198],"performance,":[199],"outperforms":[203],"existing":[205],"methodologies.":[206]},"counts_by_year":[{"year":2025,"cited_by_count":10},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":6}],"updated_date":"2026-06-19T15:47:20.252518","created_date":"2025-10-10T00:00:00"}
