{"id":"https://openalex.org/W4404032110","doi":"https://doi.org/10.1109/icccnt61001.2024.10724799","title":"Integrating Convolutional and Recurrent Networks for Image Caption Generation: A Unified Approach","display_name":"Integrating Convolutional and Recurrent Networks for Image Caption Generation: A Unified Approach","publication_year":2024,"publication_date":"2024-06-24","ids":{"openalex":"https://openalex.org/W4404032110","doi":"https://doi.org/10.1109/icccnt61001.2024.10724799"},"language":"en","primary_location":{"id":"doi:10.1109/icccnt61001.2024.10724799","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icccnt61001.2024.10724799","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 15th International Conference on Computing Communication and Networking Technologies (ICCCNT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036002274","display_name":"I Nandhini","orcid":null},"institutions":[{"id":"https://openalex.org/I1330855593","display_name":"Vel Tech Rangarajan Dr. Sagunthala R&D Institute of Science and Technology","ror":"https://ror.org/05bc5bx80","country_code":"IN","type":"education","lineage":["https://openalex.org/I1330855593"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"I Nandhini","raw_affiliation_strings":["Vel Tech Rangarajan Dr. Sagunthala R&#x0026;D Institute of Science and Technology,Department of Electronics &#x0026; Communication Engineering,Chennai,India"],"affiliations":[{"raw_affiliation_string":"Vel Tech Rangarajan Dr. Sagunthala R&#x0026;D Institute of Science and Technology,Department of Electronics &#x0026; Communication Engineering,Chennai,India","institution_ids":["https://openalex.org/I1330855593"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069732323","display_name":"L. Prasanth","orcid":null},"institutions":[{"id":"https://openalex.org/I33585257","display_name":"Anna University, Chennai","ror":"https://ror.org/01qhf1r47","country_code":"IN","type":"education","lineage":["https://openalex.org/I33585257"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"L Leo Prasanth","raw_affiliation_strings":["Anna University,Research Scholar Department of Information Science and Technology,Chennai,India"],"affiliations":[{"raw_affiliation_string":"Anna University,Research Scholar Department of Information Science and Technology,Chennai,India","institution_ids":["https://openalex.org/I33585257"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108910634","display_name":"T. J. Nagalakshmi","orcid":null},"institutions":[{"id":"https://openalex.org/I1330855593","display_name":"Vel Tech Rangarajan Dr. Sagunthala R&D Institute of Science and Technology","ror":"https://ror.org/05bc5bx80","country_code":"IN","type":"education","lineage":["https://openalex.org/I1330855593"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"T Nagalakshmi","raw_affiliation_strings":["Vel Tech Rangarajan Dr. Sagunthala R&#x0026;D Institute of Science and Technology,Department of Mathematics,Chennai,India"],"affiliations":[{"raw_affiliation_string":"Vel Tech Rangarajan Dr. Sagunthala R&#x0026;D Institute of Science and Technology,Department of Mathematics,Chennai,India","institution_ids":["https://openalex.org/I1330855593"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5109245174","display_name":"D. Manjula","orcid":null},"institutions":[{"id":"https://openalex.org/I876193797","display_name":"Vellore Institute of Technology University","ror":"https://ror.org/00qzypv28","country_code":"IN","type":"education","lineage":["https://openalex.org/I876193797"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"D Manjula","raw_affiliation_strings":["VIT University,Department of Computer Science and Engineering,Chennai,India"],"affiliations":[{"raw_affiliation_string":"VIT University,Department of Computer Science and Engineering,Chennai,India","institution_ids":["https://openalex.org/I876193797"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5036002274"],"corresponding_institution_ids":["https://openalex.org/I1330855593"],"apc_list":null,"apc_paid":null,"fwci":0.7873,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.74104241,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9908999800682068,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.980400025844574,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7791224718093872},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5081291198730469},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47167807817459106},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.4413437843322754},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.39513829350471497}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7791224718093872},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5081291198730469},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47167807817459106},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.4413437843322754},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.39513829350471497}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icccnt61001.2024.10724799","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icccnt61001.2024.10724799","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 15th International Conference on Computing Communication and Networking Technologies (ICCCNT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W2745461083","https://openalex.org/W2901218576","https://openalex.org/W2969862959","https://openalex.org/W2997591391","https://openalex.org/W3216130706","https://openalex.org/W4362566211","https://openalex.org/W4367674159","https://openalex.org/W4386162736","https://openalex.org/W4387328751","https://openalex.org/W4389491872","https://openalex.org/W6745537798","https://openalex.org/W6789753369"],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Within":[0],"the":[1,10,44,56,69,78,115,136,175,183,190],"realm":[2],"of":[3,58,68,105,107,124,138,177],"natural":[4,85],"language":[5],"processing":[6],"and":[7,17,40,60,77,98,121,153,185],"computer":[8],"vision,":[9],"synergy":[11],"between":[12],"Convolutional":[13],"Neural":[14],"Networks":[15],"(CNN)":[16],"Long":[18],"Short-Term":[19],"Memory":[20],"(LSTM)":[21],"systems":[22],"has":[23],"emerged":[24],"as":[25],"some":[26],"powerful":[27],"paradigm":[28],"for":[29,38],"image":[30,45,101,125],"captioning.":[31],"This":[32],"paper":[33],"presents":[34],"a":[35,50,111],"comprehensive":[36],"solution":[37],"visual":[39,184],"temporal":[41,122,186],"understanding":[42],"in":[43,75,84,96],"captioning":[46,150],"domain":[47],"by":[48,73,82,189],"presenting":[49],"unified":[51],"framework":[52],"that":[53],"efficiently":[54,90],"blends":[55],"strengths":[57],"CNN":[59,88],"LSTM":[61],"architectures.":[62],"Our":[63,146,156],"proposed":[64,157],"model":[65,158],"takes":[66],"advantage":[67],"spatial":[70,120],"hierarchies":[71],"captured":[72],"CNNs":[74],"images":[76],"sequential":[79],"dependencies":[80],"modeled":[81],"LSTMs":[83],"language.":[86],"The":[87,103],"component":[89],"retrieves":[91],"high-degree":[92],"features":[93],"to":[94],"result":[95],"coherent":[97],"contextually":[99],"rich":[100],"captions.":[102],"hybridization":[104],"both":[106,119],"these":[108],"networks":[109],"creates":[110],"symbiotic":[112],"relationship,":[113],"addressing":[114],"challenges":[116],"associated":[117],"with":[118,168],"aspects":[123],"interpretation.":[126],"We":[127],"carried":[128],"out":[129],"in-depth":[130],"tests":[131],"on":[132,182],"benchmark":[133],"datasets,":[134],"demonstrating":[135],"superiority":[137],"our":[139,178],"hybrid":[140,191],"CNN-LSTM":[141],"architecture":[142],"over":[143],"standalone":[144],"models.":[145],"results":[147],"showcase":[148],"improved":[149],"exactness,":[151],"fluency,":[152],"contextual":[154],"relevance.":[155],"achieved":[159],"highest":[160],"BLEU":[161],"score":[162],"$\\mathbf{0.":[163],"8":[164],"1}$":[165],"when":[166],"compared":[167],"existing":[169],"methods.":[170],"In":[171],"addition,":[172],"we":[173],"investigated":[174],"interpretability":[176],"model,":[179],"shedding":[180],"light":[181],"cues":[187],"learned":[188],"architecture.":[192]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2}],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
