{"id":"https://openalex.org/W7124842787","doi":"https://doi.org/10.1109/cvmi66673.2025.11337710","title":"From Images to Insights: A Scientometric Study of Image Captioning Research from 2021 to 2025","display_name":"From Images to Insights: A Scientometric Study of Image Captioning Research from 2021 to 2025","publication_year":2025,"publication_date":"2025-10-12","ids":{"openalex":"https://openalex.org/W7124842787","doi":"https://doi.org/10.1109/cvmi66673.2025.11337710"},"language":null,"primary_location":{"id":"doi:10.1109/cvmi66673.2025.11337710","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvmi66673.2025.11337710","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Computer Vision and Machine Intelligence (CVMI)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5123392478","display_name":"Marvi Jasrotia","orcid":null},"institutions":[{"id":"https://openalex.org/I3129773123","display_name":"Bennett University","ror":"https://ror.org/00an5hx75","country_code":"IN","type":"education","lineage":["https://openalex.org/I3129773123"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Marvi Jasrotia","raw_affiliation_strings":["School of CSET, Bennett University,Greater Noida,U.P.,India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of CSET, Bennett University,Greater Noida,U.P.,India","institution_ids":["https://openalex.org/I3129773123"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123430158","display_name":"Himanshu Sharma","orcid":null},"institutions":[{"id":"https://openalex.org/I3129773123","display_name":"Bennett University","ror":"https://ror.org/00an5hx75","country_code":"IN","type":"education","lineage":["https://openalex.org/I3129773123"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Himanshu Sharma","raw_affiliation_strings":["School of CSET, Bennett University,Greater Noida,U.P.,India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of CSET, Bennett University,Greater Noida,U.P.,India","institution_ids":["https://openalex.org/I3129773123"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5104316068","display_name":"Ashwani Kumar","orcid":null},"institutions":[{"id":"https://openalex.org/I3129773123","display_name":"Bennett University","ror":"https://ror.org/00an5hx75","country_code":"IN","type":"education","lineage":["https://openalex.org/I3129773123"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Ashwani Kumar","raw_affiliation_strings":["School of CSET, Bennett University,Greater Noida,U.P.,India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of CSET, Bennett University,Greater Noida,U.P.,India","institution_ids":["https://openalex.org/I3129773123"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.6110239,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9713000059127808,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9713000059127808,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13310","display_name":"Subtitles and Audiovisual Media","score":0.0020000000949949026,"subfield":{"id":"https://openalex.org/subfields/1203","display_name":"Language and Linguistics"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.0013000000035390258,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.9650999903678894},{"id":"https://openalex.org/keywords/scope","display_name":"Scope (computer science)","score":0.6273999810218811},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.5335999727249146},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.49320000410079956},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4713999927043915},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4406999945640564}],"concepts":[{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.9650999903678894},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6674000024795532},{"id":"https://openalex.org/C2778012447","wikidata":"https://www.wikidata.org/wiki/Q1034415","display_name":"Scope (computer science)","level":2,"score":0.6273999810218811},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.5335999727249146},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.5307999849319458},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.49320000410079956},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4713999927043915},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4648999869823456},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4406999945640564},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.40619999170303345},{"id":"https://openalex.org/C2778805511","wikidata":"https://www.wikidata.org/wiki/Q1713","display_name":"Citation","level":2,"score":0.3840000033378601},{"id":"https://openalex.org/C525823164","wikidata":"https://www.wikidata.org/wiki/Q472342","display_name":"Scientometrics","level":2,"score":0.3734999895095825},{"id":"https://openalex.org/C178315738","wikidata":"https://www.wikidata.org/wiki/Q603441","display_name":"Bibliometrics","level":2,"score":0.33329999446868896},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.32330000400543213},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3224000036716461},{"id":"https://openalex.org/C191935318","wikidata":"https://www.wikidata.org/wiki/Q148","display_name":"China","level":2,"score":0.2957000136375427},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.26489999890327454}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cvmi66673.2025.11337710","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvmi66673.2025.11337710","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Computer Vision and Machine Intelligence (CVMI)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.659512996673584}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W1976620775","https://openalex.org/W2044626341","https://openalex.org/W2150220236","https://openalex.org/W2156830856","https://openalex.org/W2160053408","https://openalex.org/W2607579284","https://openalex.org/W2896348597","https://openalex.org/W2995904231","https://openalex.org/W3043220749","https://openalex.org/W3093225449","https://openalex.org/W3098000326","https://openalex.org/W3217211907","https://openalex.org/W4255497883","https://openalex.org/W4319300501","https://openalex.org/W4366123788","https://openalex.org/W4387193636","https://openalex.org/W4387777447","https://openalex.org/W4392902791","https://openalex.org/W4394933221","https://openalex.org/W4396612944","https://openalex.org/W4400977318","https://openalex.org/W4403183405","https://openalex.org/W4405178275","https://openalex.org/W4405521165","https://openalex.org/W4407766431","https://openalex.org/W4407825355","https://openalex.org/W4408258176","https://openalex.org/W4409473986"],"related_works":[],"abstract_inverted_index":{"Image":[0],"captioning":[1,86,150,159],"is":[2],"a":[3,53,81],"challenging":[4],"task":[5],"that":[6,125],"requires":[7],"identifying":[8],"objects,":[9],"attributes,":[10],"and":[11,18,31,64,102,112,115,119],"analyzing":[12],"their":[13],"relationships":[14],"to":[15,43,90],"generate":[16],"accurate":[17],"concise":[19],"textual":[20],"descriptions.":[21],"While":[22],"numerous":[23],"surveys":[24,58],"have":[25,59],"reviewed":[26],"model":[27],"architectures,":[28],"application":[29],"domains,":[30],"evaluation":[32],"methods,":[33],"the":[34,38,46,50,62,77,142,161],"rapid":[35,163],"expansion":[36],"of":[37,49,67,84,141,148],"field":[39],"makes":[40],"it":[41],"difficult":[42],"comprehensively":[44],"capture":[45],"full":[47],"scope":[48],"literature":[51],"in":[52,70,128,135,152],"single":[54],"study.":[55],"Furthermore,":[56],"existing":[57],"not":[60],"addressed":[61],"spatial":[63,101],"temporal":[65,103],"distribution":[66],"research":[68,87,104,146],"activity":[69],"this":[71,75],"domain.":[72],"To":[73],"address":[74],"gap,":[76],"present":[78],"study":[79],"conducts":[80],"scientometric":[82],"analysis":[83],"image":[85,149,158],"from":[88],"2021":[89],"2025.":[91],"It":[92],"provides":[93],"macro-level":[94],"insights":[95],"across":[96],"four":[97],"key":[98],"dimensions:":[99],"(i)":[100],"distribution,":[105],"(ii)":[106],"collaboration":[107],"networks,":[108],"(iii)":[109],"leading":[110],"institutions":[111,147],"publication":[113,129],"venues,":[114],"(iv)":[116],"emerging":[117,155],"trends":[118],"active":[120],"subfields.":[121],"Our":[122],"findings":[123],"reveal":[124],"China":[126],"leads":[127],"output,":[130],"while":[131],"Australia":[132],"ranks":[133],"highest":[134],"average":[136],"citation":[137],"impact.":[138],"Notably,":[139],"nine":[140],"top":[143],"ten":[144],"contributing":[145],"are":[151],"China.":[153],"Among":[154],"subdomains,":[156],"medical":[157],"shows":[160],"most":[162],"growth.":[164]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-01-21T00:00:00"}
