{"id":"https://openalex.org/W4413980963","doi":"https://doi.org/10.1007/s11263-025-02577-2","title":"Language-guided Recursive Spatiotemporal Graph Modeling for Video Summarization","display_name":"Language-guided Recursive Spatiotemporal Graph Modeling for Video Summarization","publication_year":2025,"publication_date":"2025-09-04","ids":{"openalex":"https://openalex.org/W4413980963","doi":"https://doi.org/10.1007/s11263-025-02577-2"},"language":"en","primary_location":{"id":"doi:10.1007/s11263-025-02577-2","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11263-025-02577-2","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11263-025-02577-2.pdf","source":{"id":"https://openalex.org/S25538012","display_name":"International Journal of Computer Vision","issn_l":"0920-5691","issn":["0920-5691","1573-1405"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Computer Vision","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s11263-025-02577-2.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067272515","display_name":"Jungin Park","orcid":null},"institutions":[{"id":"https://openalex.org/I193775966","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96","country_code":"KR","type":"education","lineage":["https://openalex.org/I193775966"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jungin Park","raw_affiliation_strings":["Yonsei University, Seoul, Korea"],"affiliations":[{"raw_affiliation_string":"Yonsei University, Seoul, Korea","institution_ids":["https://openalex.org/I193775966"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100447461","display_name":"Jiyoung Lee","orcid":"https://orcid.org/0000-0003-0840-3317"},"institutions":[{"id":"https://openalex.org/I138925566","display_name":"Ewha Womans University","ror":"https://ror.org/053fp5c05","country_code":"KR","type":"education","lineage":["https://openalex.org/I138925566"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Jiyoung Lee","raw_affiliation_strings":["Ewha Womans University, Seoul, Korea"],"affiliations":[{"raw_affiliation_string":"Ewha Womans University, Seoul, Korea","institution_ids":["https://openalex.org/I138925566"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073320959","display_name":"Kwanghoon Sohn","orcid":"https://orcid.org/0000-0002-3715-0331"},"institutions":[{"id":"https://openalex.org/I193775966","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96","country_code":"KR","type":"education","lineage":["https://openalex.org/I193775966"]},{"id":"https://openalex.org/I58716616","display_name":"Korea Institute of Science and Technology","ror":"https://ror.org/05kzfa883","country_code":"KR","type":"facility","lineage":["https://openalex.org/I27494661","https://openalex.org/I2801339556","https://openalex.org/I2801339556","https://openalex.org/I4210144908","https://openalex.org/I4387152098","https://openalex.org/I4387152098","https://openalex.org/I58716616"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Kwanghoon Sohn","raw_affiliation_strings":["Korea Institute of Science and Technology (KIST), Seoul, Korea","Yonsei University, Seoul, Korea"],"affiliations":[{"raw_affiliation_string":"Korea Institute of Science and Technology (KIST), Seoul, Korea","institution_ids":["https://openalex.org/I58716616"]},{"raw_affiliation_string":"Yonsei University, Seoul, Korea","institution_ids":["https://openalex.org/I193775966"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100447461"],"corresponding_institution_ids":["https://openalex.org/I138925566"],"apc_list":{"value":2890,"currency":"EUR","value_usd":3690},"apc_paid":{"value":2890,"currency":"EUR","value_usd":3690},"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.22105605,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"133","issue":"12","first_page":"8617","last_page":"8641"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9937999844551086,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/automatic-summarization","display_name":"Automatic summarization","score":0.8517329692840576},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7175862789154053},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5769020915031433},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5529765486717224},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.491131991147995},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3489380180835724},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3452335596084595},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3217198848724365}],"concepts":[{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.8517329692840576},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7175862789154053},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5769020915031433},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5529765486717224},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.491131991147995},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3489380180835724},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3452335596084595},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3217198848724365}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1007/s11263-025-02577-2","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11263-025-02577-2","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11263-025-02577-2.pdf","source":{"id":"https://openalex.org/S25538012","display_name":"International Journal of Computer Vision","issn_l":"0920-5691","issn":["0920-5691","1573-1405"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Computer Vision","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2509.05604","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.05604","pdf_url":"https://arxiv.org/pdf/2509.05604","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"doi:10.1007/s11263-025-02577-2","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11263-025-02577-2","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11263-025-02577-2.pdf","source":{"id":"https://openalex.org/S25538012","display_name":"International Journal of Computer Vision","issn_l":"0920-5691","issn":["0920-5691","1573-1405"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Computer Vision","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1200101808","display_name":null,"funder_award_id":"RS-2025-00515741","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G176378680","display_name":null,"funder_award_id":"2024-22-0161","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G3034753964","display_name":null,"funder_award_id":"grant","funder_id":"https://openalex.org/F4320320671","funder_display_name":"National Research Foundation"},{"id":"https://openalex.org/G342704958","display_name":null,"funder_award_id":"funded","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G4875422403","display_name":null,"funder_award_id":"2024-22-0161","funder_id":"https://openalex.org/F4320321314","funder_display_name":"Yonsei University"}],"funders":[{"id":"https://openalex.org/F4320320671","display_name":"National Research Foundation","ror":"https://ror.org/05s0g1g46"},{"id":"https://openalex.org/F4320321314","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96"},{"id":"https://openalex.org/F4320322120","display_name":"National Research Foundation of Korea","ror":"https://ror.org/013aysd81"},{"id":"https://openalex.org/F4320328359","display_name":"Ministry of Science and ICT, South Korea","ror":"https://ror.org/01wpjm123"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4413980963.pdf","grobid_xml":"https://content.openalex.org/works/W4413980963.grobid-xml"},"referenced_works_count":82,"referenced_works":["https://openalex.org/W333230188","https://openalex.org/W1598774275","https://openalex.org/W1904325426","https://openalex.org/W1924343884","https://openalex.org/W1948812921","https://openalex.org/W1979354511","https://openalex.org/W1987366351","https://openalex.org/W1991750682","https://openalex.org/W2003553461","https://openalex.org/W2032342062","https://openalex.org/W2097117768","https://openalex.org/W2120645068","https://openalex.org/W2126802797","https://openalex.org/W2139009685","https://openalex.org/W2194775991","https://openalex.org/W2277195237","https://openalex.org/W2412782625","https://openalex.org/W2517959782","https://openalex.org/W2529272619","https://openalex.org/W2612624696","https://openalex.org/W2737677090","https://openalex.org/W2745461083","https://openalex.org/W2756203131","https://openalex.org/W2766630207","https://openalex.org/W2781922022","https://openalex.org/W2798970487","https://openalex.org/W2806331055","https://openalex.org/W2895758197","https://openalex.org/W2900393952","https://openalex.org/W2903758693","https://openalex.org/W2906502833","https://openalex.org/W2948058585","https://openalex.org/W2948246283","https://openalex.org/W2948729509","https://openalex.org/W2954137266","https://openalex.org/W2963076818","https://openalex.org/W2963091558","https://openalex.org/W2963165299","https://openalex.org/W2963220254","https://openalex.org/W2963441581","https://openalex.org/W2963474899","https://openalex.org/W2963508075","https://openalex.org/W2963919999","https://openalex.org/W2964158702","https://openalex.org/W2964167369","https://openalex.org/W2967038491","https://openalex.org/W2967219836","https://openalex.org/W2971168492","https://openalex.org/W2981385984","https://openalex.org/W2982294548","https://openalex.org/W2982672255","https://openalex.org/W2986407524","https://openalex.org/W2994107668","https://openalex.org/W3010309142","https://openalex.org/W3025569967","https://openalex.org/W3025796084","https://openalex.org/W3034681945","https://openalex.org/W3035252826","https://openalex.org/W3035365026","https://openalex.org/W3035392611","https://openalex.org/W3035590142","https://openalex.org/W3035605030","https://openalex.org/W3093411241","https://openalex.org/W3098699623","https://openalex.org/W3099141824","https://openalex.org/W3103720336","https://openalex.org/W3107128832","https://openalex.org/W3107252718","https://openalex.org/W3167092180","https://openalex.org/W3168126734","https://openalex.org/W3193902142","https://openalex.org/W3203711169","https://openalex.org/W4200630194","https://openalex.org/W4224920450","https://openalex.org/W4226103007","https://openalex.org/W4230270698","https://openalex.org/W4304080820","https://openalex.org/W4312632488","https://openalex.org/W4312748990","https://openalex.org/W4319300227","https://openalex.org/W4386076413","https://openalex.org/W4411245187"],"related_works":["https://openalex.org/W2366403280","https://openalex.org/W1495108544","https://openalex.org/W2091301346","https://openalex.org/W3148229873","https://openalex.org/W4389760904","https://openalex.org/W2150160875","https://openalex.org/W4242223894","https://openalex.org/W4306886878","https://openalex.org/W2973759123","https://openalex.org/W1517524280"],"abstract_inverted_index":{"Abstract":[0],"Video":[1],"summarization":[2,88,203],"aims":[3],"to":[4,47,81,164,175],"select":[5],"keyframes":[6],"that":[7],"are":[8,43,78,125],"visually":[9],"diverse":[10],"and":[11,109,116,127,179,200,207],"can":[12],"represent":[13],"the":[14,48,52,76,107,114,133,137,141,155,158],"whole":[15],"story":[16],"of":[17,51,68,113],"a":[18,31,64,90,172,186],"given":[19],"video.":[20,53],"Previous":[21],"approaches":[22],"have":[23],"focused":[24],"on":[25,195],"global":[26],"interlinkability":[27],"between":[28,136],"frames":[29,110],"in":[30,122,204],"video":[32,56,87,156,202],"by":[33],"temporal":[34,117],"modeling.":[35],"However,":[36],"fine-grained":[37],"visual":[38,147],"entities,":[39],"such":[40],"as":[41,89,111,185],"objects,":[42],"also":[44],"highly":[45],"related":[46,80],"main":[49],"content":[50],"Moreover,":[54],"language-guided":[55,91],"summarization,":[57],"which":[58,105],"has":[59],"recently":[60],"been":[61],"studied,":[62],"requires":[63],"comprehensive":[65],"linguistic":[66],"understanding":[67],"complex":[69],"real-world":[70],"videos.":[71],"To":[72,139],"consider":[73],"how":[74],"all":[75],"objects":[77,108],"semantically":[79],"each":[82,123,182],"other,":[83],"this":[84],"paper":[85],"regards":[86],"spatiotemporal":[92,99],"graph":[93,100,124,130,159],"modeling":[94],"problem.":[95],"We":[96],"present":[97],"recursive":[98,173],"networks,":[101],"called":[102],"VideoGraph":[103,191],",":[104],"formulate":[106],"nodes":[112,121],"spatial":[115],"graphs,":[118],"respectively.":[119],"The":[120,210],"connected":[126],"aggregated":[128],"with":[129,146],"edges,":[131],"representing":[132],"semantic":[134,166],"relationships":[135],"nodes.":[138],"prevent":[140],"edges":[142],"from":[143,154],"being":[144],"configured":[145],"similarity,":[148],"we":[149,170],"incorporate":[150],"language":[151],"queries":[152],"derived":[153],"into":[157],"node":[160,184],"representations,":[161],"enabling":[162],"them":[163],"contain":[165],"knowledge.":[167],"In":[168,188],"addition,":[169],"adopt":[171],"strategy":[174],"refine":[176],"initial":[177],"graphs":[178],"correctly":[180],"classify":[181],"frame":[183],"keyframe.":[187],"our":[189],"experiments,":[190],"achieves":[192],"state-of-the-art":[193],"performance":[194],"several":[196],"benchmarks":[197],"for":[198],"generic":[199],"query-focused":[201],"both":[205],"supervised":[206],"unsupervised":[208],"manners.":[209],"code":[211],"is":[212],"available":[213],"at":[214],"https://github.com/park-jungin/videograph":[215],".":[216]},"counts_by_year":[],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
