{"id":"https://openalex.org/W4402352579","doi":"https://doi.org/10.1109/ijcnn60899.2024.10651314","title":"Semantic Fusion Based Graph Network for Video Scene Detection","display_name":"Semantic Fusion Based Graph Network for Video Scene Detection","publication_year":2024,"publication_date":"2024-06-30","ids":{"openalex":"https://openalex.org/W4402352579","doi":"https://doi.org/10.1109/ijcnn60899.2024.10651314"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn60899.2024.10651314","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ijcnn60899.2024.10651314","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5024018042","display_name":"Ye Tian","orcid":"https://orcid.org/0000-0002-3428-1889"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Tian Ye","raw_affiliation_strings":["Beijing University of Posts and Telecommunications,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications,Beijing,China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103009087","display_name":"Yang Liu","orcid":"https://orcid.org/0000-0001-9224-3277"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Liu","raw_affiliation_strings":["Beijing University of Posts and Telecommunications,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications,Beijing,China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101690665","display_name":"Mengyu Yang","orcid":"https://orcid.org/0000-0001-7832-0926"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mengyu Yang","raw_affiliation_strings":["Beijing University of Posts and Telecommunications,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications,Beijing,China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051221338","display_name":"Lanshan Zhang","orcid":"https://orcid.org/0000-0002-0674-7864"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"LanShan Zhang","raw_affiliation_strings":["Beijing University of Posts and Telecommunications,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications,Beijing,China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5040201203","display_name":"Zhigang Li","orcid":"https://orcid.org/0000-0003-1943-9999"},"institutions":[{"id":"https://openalex.org/I23171815","display_name":"Zhengzhou University of Light Industry","ror":"https://ror.org/05fwr8z16","country_code":"CN","type":"education","lineage":["https://openalex.org/I23171815"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhigang Li","raw_affiliation_strings":["Zhengzhou University of Light Industry,Zhengzhou,China"],"affiliations":[{"raw_affiliation_string":"Zhengzhou University of Light Industry,Zhengzhou,China","institution_ids":["https://openalex.org/I23171815"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5024018042"],"corresponding_institution_ids":["https://openalex.org/I139759216"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14609876,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"32","issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7585705518722534},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5295642018318176},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.495552659034729},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.42177414894104004},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.17011356353759766}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7585705518722534},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5295642018318176},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.495552659034729},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.42177414894104004},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.17011356353759766}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn60899.2024.10651314","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ijcnn60899.2024.10651314","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320334111","display_name":"Innovation Fund","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W2132579158","https://openalex.org/W2151617679","https://openalex.org/W2194775991","https://openalex.org/W2488838104","https://openalex.org/W2528841789","https://openalex.org/W2567251966","https://openalex.org/W2598967697","https://openalex.org/W2732026016","https://openalex.org/W2771870130","https://openalex.org/W2793722489","https://openalex.org/W2808531442","https://openalex.org/W2890234794","https://openalex.org/W2950467135","https://openalex.org/W2954585581","https://openalex.org/W2955389138","https://openalex.org/W2962711930","https://openalex.org/W2963066159","https://openalex.org/W2972317931","https://openalex.org/W3003393086","https://openalex.org/W3003652270","https://openalex.org/W3022850065","https://openalex.org/W3034623254","https://openalex.org/W3082069042","https://openalex.org/W3089957576","https://openalex.org/W3093019345","https://openalex.org/W3099032148","https://openalex.org/W3107241266","https://openalex.org/W3111800901","https://openalex.org/W3128384204","https://openalex.org/W3158005556","https://openalex.org/W3170011646","https://openalex.org/W3173459793","https://openalex.org/W4214887514","https://openalex.org/W4293327715","https://openalex.org/W4385701385","https://openalex.org/W4387968052","https://openalex.org/W4391769767","https://openalex.org/W6765133443","https://openalex.org/W6767288045","https://openalex.org/W6842727381"],"related_works":["https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2772917594","https://openalex.org/W2775347418","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Video":[0,27,176],"scene":[1,28,118,194],"detection,":[2],"an":[3],"initial":[4],"step":[5],"of":[6,98,116],"video":[7,12,21,32,84,117,193],"analysis,":[8],"temporally":[9],"divides":[10],"heterogeneous":[11],"into":[13,33,41],"semantic":[14,103,123,156],"segments,":[15],"which":[16,146],"is":[17,54,92,111],"widely":[18],"used":[19],"in":[20,125,192],"summarization,":[22],"search,":[23],"browsing":[24],"and":[25,36,65,108,131,150,161,174],"retrieval.":[26],"detection":[29,195],"always":[30],"cuts":[31],"shots":[34,40,53],"first":[35],"then":[37],"groups":[38],"these":[39],"segments.":[42],"In":[43,86],"this":[44,87],"process,":[45],"how":[46],"to":[47,69,94,153],"solve":[48],"complex":[49,96],"dependency":[50,72],"relationship":[51,73],"among":[52],"a":[55,80,89,113,142],"barrier.":[56],"The":[57,164],"existing":[58],"methods":[59],"consider":[60],"using":[61],"Recurrent":[62],"Neural":[63],"Networks":[64],"Hidden":[66],"Markov":[67],"Model":[68],"simulate":[70],"the":[71,102,155,181,186,190],"between":[74,105,158],"shots.":[75],"However,":[76],"linear":[77],"approaches":[78],"work":[79],"little":[81],"on":[82,169],"hierarchical":[83],"structure.":[85],"paper,":[88],"GNN-based":[90],"network":[91],"proposed":[93,165,187],"model":[95],"structures":[97],"videos":[99],"instead.":[100],"Besides,":[101],"gap":[104,157],"low-level":[106,159],"features":[107,160],"high-level":[109,162],"semantics":[110],"also":[112],"big":[114],"obstacle":[115],"detection.":[119],"Here,":[120],"three":[121],"visual":[122],"elements":[124],"shot,":[126],"i.e.,":[127],"environment,":[128],"object,":[129],"action":[130],"audio":[132],"feature":[133],"are":[134],"extracted":[135],"as":[136],"shot":[137],"representation.":[138],"Later,":[139],"we":[140],"utilize":[141],"multi-modal":[143],"fusion":[144,149],"strategy,":[145],"combines":[147],"early":[148],"late":[151],"fusion,":[152],"bridge":[154],"semantics.":[163],"method":[166,188],"was":[167],"evaluated":[168],"BBC":[170],"Planet":[171],"Earth":[172],"dataset":[173],"Open":[175],"Scene":[177],"Detection":[178],"(OSVD)":[179],"dataset,":[180],"experimental":[182],"results":[183],"demonstrate":[184],"that":[185],"outperforms":[189],"state-of-the-art":[191],"task.":[196]},"counts_by_year":[],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
