{"id":"https://openalex.org/W4390909471","doi":"https://doi.org/10.1186/s40537-024-00878-w","title":"Bilingual video captioning model for enhanced video retrieval","display_name":"Bilingual video captioning model for enhanced video retrieval","publication_year":2024,"publication_date":"2024-01-16","ids":{"openalex":"https://openalex.org/W4390909471","doi":"https://doi.org/10.1186/s40537-024-00878-w"},"language":"en","primary_location":{"id":"doi:10.1186/s40537-024-00878-w","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-024-00878-w","pdf_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-024-00878-w","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-024-00878-w","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039139632","display_name":"Norah Alrebdi","orcid":null},"institutions":[{"id":"https://openalex.org/I156216236","display_name":"Qassim University","ror":"https://ror.org/01wsfe280","country_code":"SA","type":"education","lineage":["https://openalex.org/I156216236"]}],"countries":["SA"],"is_corresponding":true,"raw_author_name":"Norah Alrebdi","raw_affiliation_strings":["Department of Information Technology, College of Computer, Qassim University, 51452, Buraydah, Saudi Arabia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Information Technology, College of Computer, Qassim University, 51452, Buraydah, Saudi Arabia","institution_ids":["https://openalex.org/I156216236"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5013171598","display_name":"Amal A. Al-Shargabi","orcid":"https://orcid.org/0000-0002-7312-9003"},"institutions":[{"id":"https://openalex.org/I156216236","display_name":"Qassim University","ror":"https://ror.org/01wsfe280","country_code":"SA","type":"education","lineage":["https://openalex.org/I156216236"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"Amal A. Al-Shargabi","raw_affiliation_strings":["Department of Information Technology, College of Computer, Qassim University, 51452, Buraydah, Saudi Arabia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Information Technology, College of Computer, Qassim University, 51452, Buraydah, Saudi Arabia","institution_ids":["https://openalex.org/I156216236"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5039139632"],"corresponding_institution_ids":["https://openalex.org/I156216236"],"apc_list":{"value":1060,"currency":"GBP","value_usd":1300},"apc_paid":{"value":1060,"currency":"GBP","value_usd":1300},"fwci":2.0194,"has_fulltext":true,"cited_by_count":9,"citation_normalized_percentile":{"value":0.87041079,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":"11","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9894000291824341,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.9297467470169067},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.9094748497009277},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.56183260679245},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5456058382987976},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.527150571346283},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.46653443574905396},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.452149897813797},{"id":"https://openalex.org/keywords/video-quality","display_name":"Video quality","score":0.44767606258392334},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.44179341197013855},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.4128960967063904},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.37025365233421326},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.20610427856445312}],"concepts":[{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.9297467470169067},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9094748497009277},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.56183260679245},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5456058382987976},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.527150571346283},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.46653443574905396},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.452149897813797},{"id":"https://openalex.org/C103910844","wikidata":"https://www.wikidata.org/wiki/Q2631256","display_name":"Video quality","level":3,"score":0.44767606258392334},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.44179341197013855},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.4128960967063904},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.37025365233421326},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.20610427856445312},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1186/s40537-024-00878-w","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-024-00878-w","pdf_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-024-00878-w","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:44689cda5f6848818bb702d03d1eaeaa","is_oa":true,"landing_page_url":"https://doaj.org/article/44689cda5f6848818bb702d03d1eaeaa","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Journal of Big Data, Vol 11, Iss 1, Pp 1-24 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1186/s40537-024-00878-w","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s40537-024-00878-w","pdf_url":"https://journalofbigdata.springeropen.com/counter/pdf/10.1186/s40537-024-00878-w","source":{"id":"https://openalex.org/S2737955091","display_name":"Journal Of Big Data","issn_l":"2196-1115","issn":["2196-1115"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Big Data","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.6499999761581421,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320324403","display_name":"Qassim University","ror":"https://ror.org/01wsfe280"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4390909471.pdf"},"referenced_works_count":47,"referenced_works":["https://openalex.org/W877909479","https://openalex.org/W1586939924","https://openalex.org/W1588719663","https://openalex.org/W1663984431","https://openalex.org/W1956340063","https://openalex.org/W1973965874","https://openalex.org/W1978394996","https://openalex.org/W2064675550","https://openalex.org/W2097606805","https://openalex.org/W2101105183","https://openalex.org/W2125707784","https://openalex.org/W2133665775","https://openalex.org/W2152984213","https://openalex.org/W2163636861","https://openalex.org/W2164290393","https://openalex.org/W2194775991","https://openalex.org/W2613052503","https://openalex.org/W2765811365","https://openalex.org/W2793959159","https://openalex.org/W2887712318","https://openalex.org/W2964241990","https://openalex.org/W2990045262","https://openalex.org/W3009192917","https://openalex.org/W3035112208","https://openalex.org/W3038017128","https://openalex.org/W3087632114","https://openalex.org/W3095591473","https://openalex.org/W3122132232","https://openalex.org/W3132880751","https://openalex.org/W3151123052","https://openalex.org/W3153565615","https://openalex.org/W3163971663","https://openalex.org/W3175065555","https://openalex.org/W3179529441","https://openalex.org/W3188533866","https://openalex.org/W3196336622","https://openalex.org/W3198212100","https://openalex.org/W3207317116","https://openalex.org/W3216659302","https://openalex.org/W4211045496","https://openalex.org/W4212903594","https://openalex.org/W4213152894","https://openalex.org/W4286610731","https://openalex.org/W4289435181","https://openalex.org/W4311412445","https://openalex.org/W4311424438","https://openalex.org/W6797674293"],"related_works":["https://openalex.org/W4210416330","https://openalex.org/W4388002133","https://openalex.org/W3173149175","https://openalex.org/W2170297402","https://openalex.org/W2276021436","https://openalex.org/W2561364921","https://openalex.org/W3199673414","https://openalex.org/W2118568109","https://openalex.org/W2057320948","https://openalex.org/W2104411120"],"abstract_inverted_index":{"Abstract":[0],"Many":[1],"video":[2,12,23,41,59,69,172,189,223,252],"platforms":[3],"rely":[4],"on":[5,129],"the":[6,121,178,199,210,222,225,236],"descriptions":[7],"that":[8,72,177],"uploaders":[9],"provide":[10],"for":[11,95,140,171],"retrieval.":[13,173,190],"However,":[14],"this":[15,27],"reliance":[16],"may":[17],"cause":[18],"inaccuracies.":[19],"Although":[20],"deep":[21],"learning-based":[22],"captioning":[24,60,70],"can":[25],"resolve":[26],"problem,":[28],"it":[29],"has":[30],"some":[31],"limitations:":[32],"(1)":[33],"traditional":[34],"keyframe":[35,76,87],"extraction":[36,77,88],"techniques":[37],"do":[38],"not":[39,62],"consider":[40],"length/content,":[42],"resulting":[43],"in":[44,58,119,247],"low":[45],"accuracy,":[46],"high":[47],"storage":[48,100],"requirements,":[49,102],"and":[50,79,83,92,103,108,123,154,188,197,206,217,227,233,251],"long":[51,116],"processing":[52],"times;":[53],"(2)":[54],"Arabic":[55,82,109,211,228],"language":[56],"support":[57],"is":[61],"extensive.":[63],"This":[64],"study":[65],"proposes":[66],"a":[67,112],"new":[68],"approach":[71],"uses":[73,90],"an":[74],"efficient":[75],"method":[78],"supports":[80],"both":[81,120],"English.":[84],"The":[85,106,174],"proposed":[86],"technique":[89],"time-":[91],"content-based":[93],"approaches":[94],"better":[96,182],"quality":[97,131,187],"captions,":[98],"fewer":[99],"space":[101],"faster":[104],"processing.":[105],"English":[107,179,200,226],"models":[110,126,229,243],"use":[111],"sequence-to-sequence":[113],"framework":[114],"with":[115,144,183,239],"short-term":[117],"memory":[118],"encoder":[122],"decoder.":[124],"Both":[125],"were":[127,161],"evaluated":[128,163],"caption":[130,186],"using":[132,164],"four":[133],"metrics:":[134],"bilingual":[135],"evaluation":[136,141,152,158],"understudy":[137,149],"(BLEU),":[138],"metric":[139],"of":[142,150,193,235],"translation":[143],"explicit":[145],"ORdering":[146],"(METEOR),":[147],"recall-oriented":[148],"gisting":[151],"(ROUGE-L),":[153],"consensus-based":[155],"image":[156],"description":[157],"(CIDE-r).":[159],"They":[160],"also":[162],"cosine":[165],"similarity":[166],"to":[167,185,221],"determine":[168],"their":[169],"suitability":[170],"results":[175],"demonstrated":[176],"model":[180,201,212],"performed":[181],"regards":[184],"In":[191],"terms":[192],"BLEU,":[194],"METEOR,":[195],"ROUGE-L,":[196],"CIDE-r,":[198],"scored":[202,213],"47.18,":[203],"30.46,":[204],"62.07,":[205],"59.98,":[207],"respectively,":[208,238],"whereas":[209],"21.65,":[214],"36.30,":[215],"44.897,":[216],"45.52,":[218],"respectively.":[219],"According":[220],"retrieval,":[224],"successfully":[230],"retrieved":[231],"67%":[232],"40%":[234],"videos,":[237],"20%":[240],"similarity.":[241],"These":[242],"have":[244],"potential":[245],"applications":[246],"storytelling,":[248],"sports":[249],"commentaries,":[250],"surveillance.":[253]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":5}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
