{"id":"https://openalex.org/W7125018988","doi":"https://doi.org/10.1109/cbmi66578.2025.11339337","title":"An Experimental Study on Generating Plausible Textual Explanations for Video Summarization*","display_name":"An Experimental Study on Generating Plausible Textual Explanations for Video Summarization*","publication_year":2025,"publication_date":"2025-10-22","ids":{"openalex":"https://openalex.org/W7125018988","doi":"https://doi.org/10.1109/cbmi66578.2025.11339337"},"language":null,"primary_location":{"id":"doi:10.1109/cbmi66578.2025.11339337","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cbmi66578.2025.11339337","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Content-Based Multimedia Indexing (CBMI)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5123403892","display_name":"Thomas Eleftheriadis","orcid":null},"institutions":[{"id":"https://openalex.org/I4210093649","display_name":"Information Technologies Institute","ror":"https://ror.org/0069akp70","country_code":"GR","type":"nonprofit","lineage":["https://openalex.org/I4210093649"]}],"countries":["GR"],"is_corresponding":true,"raw_author_name":"Thomas Eleftheriadis","raw_affiliation_strings":["ITI, CERTH,Thessaloniki,Greece"],"affiliations":[{"raw_affiliation_string":"ITI, CERTH,Thessaloniki,Greece","institution_ids":["https://openalex.org/I4210093649"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123415276","display_name":"Evlampios Apostolidis","orcid":null},"institutions":[{"id":"https://openalex.org/I4210093649","display_name":"Information Technologies Institute","ror":"https://ror.org/0069akp70","country_code":"GR","type":"nonprofit","lineage":["https://openalex.org/I4210093649"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Evlampios Apostolidis","raw_affiliation_strings":["ITI, CERTH,Thessaloniki,Greece"],"affiliations":[{"raw_affiliation_string":"ITI, CERTH,Thessaloniki,Greece","institution_ids":["https://openalex.org/I4210093649"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5123391564","display_name":"Vasileios Mezaris","orcid":null},"institutions":[{"id":"https://openalex.org/I4210093649","display_name":"Information Technologies Institute","ror":"https://ror.org/0069akp70","country_code":"GR","type":"nonprofit","lineage":["https://openalex.org/I4210093649"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Vasileios Mezaris","raw_affiliation_strings":["ITI, CERTH,Thessaloniki,Greece"],"affiliations":[{"raw_affiliation_string":"ITI, CERTH,Thessaloniki,Greece","institution_ids":["https://openalex.org/I4210093649"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5123403892"],"corresponding_institution_ids":["https://openalex.org/I4210093649"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.70137866,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8537999987602234,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8537999987602234,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.062300000339746475,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.0272000003606081,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/automatic-summarization","display_name":"Automatic summarization","score":0.7574999928474426},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.6773999929428101},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.515999972820282},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.4602000117301941},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.42089998722076416},{"id":"https://openalex.org/keywords/natural","display_name":"Natural (archaeology)","score":0.4117000102996826},{"id":"https://openalex.org/keywords/abstraction","display_name":"Abstraction","score":0.3075000047683716}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.79339998960495},{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.7574999928474426},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.6773999929428101},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6104999780654907},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5565000176429749},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.515999972820282},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.4602000117301941},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.42089998722076416},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.4117000102996826},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.3075000047683716},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.30410000681877136},{"id":"https://openalex.org/C2776187449","wikidata":"https://www.wikidata.org/wiki/Q1513879","display_name":"Natural language generation","level":3,"score":0.3005000054836273},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.2994000017642975},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.2824999988079071},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.27469998598098755},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.27140000462532043},{"id":"https://openalex.org/C511192102","wikidata":"https://www.wikidata.org/wiki/Q5156948","display_name":"Comprehension","level":2,"score":0.27079999446868896}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cbmi66578.2025.11339337","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cbmi66578.2025.11339337","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Content-Based Multimedia Indexing (CBMI)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4163844585418701,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W1924343884","https://openalex.org/W2031489346","https://openalex.org/W2097117768","https://openalex.org/W2108598243","https://openalex.org/W2516809705","https://openalex.org/W2921802966","https://openalex.org/W3034917890","https://openalex.org/W3119886052","https://openalex.org/W3175950569","https://openalex.org/W3210314917","https://openalex.org/W3216015240","https://openalex.org/W3217619974","https://openalex.org/W4220751672","https://openalex.org/W4255898812","https://openalex.org/W4317791940","https://openalex.org/W4386065706","https://openalex.org/W4387149478","https://openalex.org/W4390190266","https://openalex.org/W4399039063","https://openalex.org/W4401451913","https://openalex.org/W4409917740"],"related_works":[],"abstract_inverted_index":{"In":[0],"this":[1,23],"paper,":[2],"we":[3,25,58,91,144],"present":[4],"our":[5],"experimental":[6],"study":[7,148],"on":[8,60,134],"generating":[9,182],"plausible":[10,173,183],"textual":[11,109,113,184],"explanations":[12,75,101,168,185],"for":[13,30,67,95,126,159,181,186],"the":[14,20,53,63,70,73,82,88,97,104,112,116,121,135,139,165,171,177],"outcomes":[15],"of":[16,22,33,52,62,72,99,115,123],"video":[17,34,118,160,187],"summarization.":[18,188],"For":[19],"needs":[21],"study,":[24],"extend":[26],"an":[27,93,146],"existing":[28],"framework":[29,137],"multigranular":[31],"explanation":[32],"summarization":[35],"by":[36,102],"integrating":[37],"a":[38,150],"SOTA":[39,151],"Large":[40],"Multimodal":[41],"Model":[42],"(LLaVA-OneVision)":[43],"and":[44,85,111,138,154,175],"prompting":[45],"it":[46],"to":[47,162],"produce":[48],"natural":[49],"language":[50],"descriptions":[51,110,114],"obtained":[54,74],"visual":[55,100],"explanations.":[56],"Following,":[57],"focus":[59],"one":[61],"most":[64,178],"desired":[65],"characteristics":[66],"explainable":[68],"AI,":[69],"plausibility":[71,98,141],"that":[76],"relates":[77],"with":[78,81,120],"their":[79,108],"alignment":[80],"humans'":[83],"reasoning":[84],"expectations.":[86],"Using":[87],"extended":[89,136],"framework,":[90],"propose":[92],"approach":[94,180],"evaluating":[96],"quantifying":[103],"semantic":[105],"overlap":[106],"between":[107],"corresponding":[117],"summaries,":[119],"help":[122],"two":[124,155],"methods":[125],"creating":[127],"sentence":[128],"embed":[129],"dings":[130],"(SBERT,":[131],"SimCSE).":[132],"Based":[133],"proposed":[140],"evaluation":[142],"approach,":[143],"conduct":[145],"exper-imental":[147],"using":[149],"method":[152],"(CA-SUM)":[153],"datasets":[156],"(SumMe,":[157],"TVSum)":[158],"summarization,":[161],"examine":[163],"whether":[164],"more":[166,172],"faithful":[167],"are":[169],"also":[170],"ones,":[174],"identify":[176],"appropriate":[179]},"counts_by_year":[],"updated_date":"2026-01-22T23:29:09.771500","created_date":"2026-01-21T00:00:00"}
