{"id":"https://openalex.org/W4211045496","doi":"https://doi.org/10.1186/s40537-022-00569-4","title":"Semantic context driven language descriptions of videos using deep neural network","display_name":"Semantic context driven language descriptions of videos using deep neural network","publication_year":2022,"publication_date":"2022-02-10","ids":{"openalex":"https://openalex.org/W4211045496","doi":"https://doi.org/10.1186/s40537-022-00569-4"},"language":"en","primary_location":{"id":"doi:10.1186/s40537-022-00569-4","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-022-00569-4","pdf_url":"https://journalofbigdata.springeropen.com/track/pdf/10.1186/s40537-022-00569-4","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://journalofbigdata.springeropen.com/track/pdf/10.1186/s40537-022-00569-4","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037889655","display_name":"Dinesh Naik","orcid":"https://orcid.org/0000-0002-8989-6282"},"institutions":[{"id":"https://openalex.org/I11880225","display_name":"National Institute of Technology Karnataka","ror":"https://ror.org/01hz4v948","country_code":"IN","type":"education","lineage":["https://openalex.org/I11880225"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Dinesh Naik","raw_affiliation_strings":["Department of Information Technology, National Institute of Technology Karnataka, Surathkal, Mangalore, 575025, India"],"raw_orcid":"https://orcid.org/0000-0002-8989-6282","affiliations":[{"raw_affiliation_string":"Department of Information Technology, National Institute of Technology Karnataka, Surathkal, Mangalore, 575025, India","institution_ids":["https://openalex.org/I11880225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5054016512","display_name":"C. D. Jaidhar","orcid":null},"institutions":[{"id":"https://openalex.org/I11880225","display_name":"National Institute of Technology Karnataka","ror":"https://ror.org/01hz4v948","country_code":"IN","type":"education","lineage":["https://openalex.org/I11880225"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"C. D. Jaidhar","raw_affiliation_strings":["Department of Information Technology, National Institute of Technology Karnataka, Surathkal, Mangalore, 575025, India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Information Technology, National Institute of Technology Karnataka, Surathkal, Mangalore, 575025, India","institution_ids":["https://openalex.org/I11880225"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5037889655"],"corresponding_institution_ids":["https://openalex.org/I11880225"],"apc_list":{"value":1060,"currency":"GBP","value_usd":1300},"apc_paid":{"value":1060,"currency":"GBP","value_usd":1300},"fwci":0.7108,"has_fulltext":true,"cited_by_count":8,"citation_normalized_percentile":{"value":0.69069009,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"9","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9146289229393005},{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.8226579427719116},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6069815158843994},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5935887694358826},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.583362340927124},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5352874994277954},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.525192379951477},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5189173221588135},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4852013885974884},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.4664183557033539},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4552319645881653},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.45062756538391113},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.4483187198638916},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.43337833881378174},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4125828742980957},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.218307226896286}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9146289229393005},{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.8226579427719116},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6069815158843994},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5935887694358826},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.583362340927124},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5352874994277954},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.525192379951477},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5189173221588135},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4852013885974884},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.4664183557033539},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4552319645881653},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.45062756538391113},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.4483187198638916},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.43337833881378174},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4125828742980957},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.218307226896286},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1186/s40537-022-00569-4","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-022-00569-4","pdf_url":"https://journalofbigdata.springeropen.com/track/pdf/10.1186/s40537-022-00569-4","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:969989432f1248938c16889dfa2de86e","is_oa":true,"landing_page_url":"https://doaj.org/article/969989432f1248938c16889dfa2de86e","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Journal of Big Data, Vol 9, Iss 1, Pp 1-22 (2022)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1186/s40537-022-00569-4","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-022-00569-4","pdf_url":"https://journalofbigdata.springeropen.com/track/pdf/10.1186/s40537-022-00569-4","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.7599999904632568,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4211045496.pdf","grobid_xml":"https://content.openalex.org/works/W4211045496.grobid-xml"},"referenced_works_count":54,"referenced_works":["https://openalex.org/W1573040851","https://openalex.org/W1586939924","https://openalex.org/W1895577753","https://openalex.org/W1931639407","https://openalex.org/W1956340063","https://openalex.org/W2064675550","https://openalex.org/W2080672747","https://openalex.org/W2101105183","https://openalex.org/W2139501017","https://openalex.org/W2164290393","https://openalex.org/W2183341477","https://openalex.org/W2250539671","https://openalex.org/W2302086703","https://openalex.org/W2506483933","https://openalex.org/W2523993696","https://openalex.org/W2557264465","https://openalex.org/W2731627339","https://openalex.org/W2739107216","https://openalex.org/W2765658575","https://openalex.org/W2766375149","https://openalex.org/W2803620531","https://openalex.org/W2808203533","https://openalex.org/W2887712318","https://openalex.org/W2888798257","https://openalex.org/W2900626451","https://openalex.org/W2901292676","https://openalex.org/W2907342958","https://openalex.org/W2908356592","https://openalex.org/W2914306086","https://openalex.org/W2941825186","https://openalex.org/W2945223572","https://openalex.org/W2953461088","https://openalex.org/W2962861647","https://openalex.org/W2963341956","https://openalex.org/W2963552819","https://openalex.org/W2963576560","https://openalex.org/W2963843052","https://openalex.org/W2964081807","https://openalex.org/W2964167369","https://openalex.org/W2964241990","https://openalex.org/W2979437663","https://openalex.org/W2998637494","https://openalex.org/W2999226135","https://openalex.org/W3022304420","https://openalex.org/W3046652249","https://openalex.org/W3094125946","https://openalex.org/W3098682680","https://openalex.org/W3128484727","https://openalex.org/W3140854437","https://openalex.org/W3191137294","https://openalex.org/W3197863338","https://openalex.org/W3197878906","https://openalex.org/W3202435008","https://openalex.org/W4229942105"],"related_works":["https://openalex.org/W4210416330","https://openalex.org/W3088136942","https://openalex.org/W2949362007","https://openalex.org/W2775506363","https://openalex.org/W4290852288","https://openalex.org/W4388893791","https://openalex.org/W4283207562","https://openalex.org/W2963177403","https://openalex.org/W2330246314","https://openalex.org/W3009270862"],"abstract_inverted_index":{"Abstract":[0],"The":[1,127,153,173,196,240],"massive":[2],"addition":[3],"of":[4,26,175,230,250,253],"data":[5,22,28],"to":[6,47,122,133,165,208],"the":[7,20,76,89,101,112,119,124,131,142,163,171,176,182,201,209,213,228,251,254],"internet":[8],"in":[9,19,31,40,242,258],"text,":[10],"images,":[11],"and":[12,29,68,78,135,140,145,156,225,234,237],"videos":[13],"made":[14],"computer":[15,41],"vision-based":[16],"tasks":[17],"challenging":[18],"big":[21],"domain.":[23],"Recent":[24],"exploration":[25],"video":[27,102,183],"progress":[30],"visual":[32,49,113,143,154],"information":[33,50],"captioning":[34,44,184],"has":[35],"been":[36],"an":[37,58,79,84],"arduous":[38],"task":[39],"vision.":[42],"Visual":[43,96],"is":[45,179],"attributable":[46],"integrating":[48],"with":[51,61,83,91,227],"natural":[52,167],"language":[53,146],"descriptions.":[54],"This":[55],"paper":[56],"proposes":[57],"encoder-decoder":[59],"framework":[60,178,203],"a":[62,92,105,246],"2D-Convolutional":[63],"Neural":[64],"Network":[65],"(CNN)":[66],"model":[67,81,107,215],"layered":[69,120],"Long":[70],"Short":[71],"Term":[72],"Memory":[73],"(LSTM)":[74],"as":[75,88],"encoder":[77],"LSTM":[80,121],"integrated":[82],"attention":[85,128],"mechanism":[86,129],"working":[87],"decoder":[90,132,164],"hybrid":[93],"loss":[94],"function.":[95],"feature":[97,114],"vectors":[98,115],"extracted":[99],"from":[100],"frames":[103],"using":[104,191],"2D-CNN":[106],"capture":[108,123],"spatial":[109],"features.":[110],"Specifically,":[111],"are":[116,160],"fed":[117],"into":[118,162],"temporal":[125],"information.":[126],"enables":[130],"perceive":[134],"focus":[136],"on":[137,181],"relevant":[138],"objects":[139],"correlate":[141],"context":[144,252],"content":[147],"for":[148,170],"producing":[149],"semantically":[150],"correct":[151],"captions.":[152],"features":[155],"GloVe":[157],"word":[158],"embeddings":[159],"input":[161],"generate":[166],"semantic":[168],"descriptions":[169],"videos.":[172],"performance":[174],"proposed":[177,214],"evaluated":[180],"benchmark":[185],"dataset":[186],"Microsoft":[187],"Video":[188],"Description":[189],"(MSVD)":[190],"various":[192],"well-known":[193],"evaluation":[194],"metrics.":[195],"experimental":[197],"findings":[198],"indicate":[199],"that":[200],"suggested":[202],"outperforms":[204],"state-of-the-art":[205,210],"techniques.":[206],"Compared":[207],"research":[211],"methods,":[212],"significantly":[216],"increased":[217],"all":[218,243],"measures,":[219],"B@1,":[220],"B@2,":[221],"B@3,":[222],"B@4,":[223],"METEOR,":[224],"CIDEr,":[226],"score":[229],"78.4,":[231],"64.8,":[232],"54.2,":[233],"43.7,":[235],"32.3,":[236],"70.7,":[238],"respectively.":[239],"progression":[241],"scores":[244],"indicates":[245],"more":[247,259],"excellent":[248],"grasp":[249],"inputs,":[255],"which":[256],"results":[257],"accurate":[260],"caption":[261],"prediction.":[262]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-19T15:47:20.252518","created_date":"2025-10-10T00:00:00"}
