{"id":"https://openalex.org/W4402351112","doi":"https://doi.org/10.1109/ijcnn60899.2024.10651049","title":"Multimodal Video Highlight Detection with Noise-Robust Learning","display_name":"Multimodal Video Highlight Detection with Noise-Robust Learning","publication_year":2024,"publication_date":"2024-06-30","ids":{"openalex":"https://openalex.org/W4402351112","doi":"https://doi.org/10.1109/ijcnn60899.2024.10651049"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn60899.2024.10651049","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ijcnn60899.2024.10651049","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109840598","display_name":"Yinhui Jiang","orcid":null},"institutions":[{"id":"https://openalex.org/I109935558","display_name":"Ningbo University","ror":"https://ror.org/03et85d35","country_code":"CN","type":"education","lineage":["https://openalex.org/I109935558"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yinhui Jiang","raw_affiliation_strings":["Ningbo University,The Faculty of Electrical Engineering and Computer Science,Ningbo,China"],"affiliations":[{"raw_affiliation_string":"Ningbo University,The Faculty of Electrical Engineering and Computer Science,Ningbo,China","institution_ids":["https://openalex.org/I109935558"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072269410","display_name":"Sihui Luo","orcid":"https://orcid.org/0000-0003-2822-0446"},"institutions":[{"id":"https://openalex.org/I109935558","display_name":"Ningbo University","ror":"https://ror.org/03et85d35","country_code":"CN","type":"education","lineage":["https://openalex.org/I109935558"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sihui Luo","raw_affiliation_strings":["Ningbo University,The Faculty of Electrical Engineering and Computer Science,Ningbo,China"],"affiliations":[{"raw_affiliation_string":"Ningbo University,The Faculty of Electrical Engineering and Computer Science,Ningbo,China","institution_ids":["https://openalex.org/I109935558"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013717269","display_name":"Lijun Guo","orcid":"https://orcid.org/0000-0002-6133-9564"},"institutions":[{"id":"https://openalex.org/I109935558","display_name":"Ningbo University","ror":"https://ror.org/03et85d35","country_code":"CN","type":"education","lineage":["https://openalex.org/I109935558"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lijun Guo","raw_affiliation_strings":["Ningbo University,The Faculty of Electrical Engineering and Computer Science,Ningbo,China"],"affiliations":[{"raw_affiliation_string":"Ningbo University,The Faculty of Electrical Engineering and Computer Science,Ningbo,China","institution_ids":["https://openalex.org/I109935558"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101618645","display_name":"Rong Zhang","orcid":"https://orcid.org/0000-0001-8019-245X"},"institutions":[{"id":"https://openalex.org/I109935558","display_name":"Ningbo University","ror":"https://ror.org/03et85d35","country_code":"CN","type":"education","lineage":["https://openalex.org/I109935558"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rong Zhang","raw_affiliation_strings":["Ningbo University,The Faculty of Electrical Engineering and Computer Science,Ningbo,China"],"affiliations":[{"raw_affiliation_string":"Ningbo University,The Faculty of Electrical Engineering and Computer Science,Ningbo,China","institution_ids":["https://openalex.org/I109935558"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5109840598"],"corresponding_institution_ids":["https://openalex.org/I109935558"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14191905,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7520924210548401},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.5379221439361572},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5083553194999695},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4284241795539856},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.41148841381073},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.10039246082305908}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7520924210548401},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.5379221439361572},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5083553194999695},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4284241795539856},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.41148841381073},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.10039246082305908}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn60899.2024.10651049","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ijcnn60899.2024.10651049","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320322927","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":52,"referenced_works":["https://openalex.org/W329267344","https://openalex.org/W398859631","https://openalex.org/W1924343884","https://openalex.org/W2103908291","https://openalex.org/W2115245686","https://openalex.org/W2143800062","https://openalex.org/W2155635849","https://openalex.org/W2170095155","https://openalex.org/W2194345886","https://openalex.org/W2467794422","https://openalex.org/W2593116425","https://openalex.org/W2619947201","https://openalex.org/W2737677090","https://openalex.org/W2788321336","https://openalex.org/W2791295466","https://openalex.org/W2797074994","https://openalex.org/W2803187616","https://openalex.org/W2897091983","https://openalex.org/W2919974746","https://openalex.org/W2947049994","https://openalex.org/W2963524571","https://openalex.org/W2963691181","https://openalex.org/W2963729528","https://openalex.org/W2963735582","https://openalex.org/W2981873476","https://openalex.org/W2996108195","https://openalex.org/W2996988779","https://openalex.org/W2997669288","https://openalex.org/W3034185248","https://openalex.org/W3094550259","https://openalex.org/W3104255659","https://openalex.org/W3105607218","https://openalex.org/W3106645934","https://openalex.org/W3109316002","https://openalex.org/W3110687497","https://openalex.org/W3174906557","https://openalex.org/W3196253003","https://openalex.org/W3201832684","https://openalex.org/W3202168743","https://openalex.org/W4312544061","https://openalex.org/W4312680331","https://openalex.org/W4313014573","https://openalex.org/W6751420435","https://openalex.org/W6751647823","https://openalex.org/W6763576130","https://openalex.org/W6771630921","https://openalex.org/W6781645381","https://openalex.org/W6785821353","https://openalex.org/W6791353385","https://openalex.org/W6797613833","https://openalex.org/W6849777976","https://openalex.org/W6955071965"],"related_works":["https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2772917594","https://openalex.org/W2775347418","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Video":[0],"highlight":[1,32,80,182],"detection":[2,33,81],"aims":[3],"to":[4,121,127],"select":[5],"the":[6,20,43,67,103,129,136,141,168,176],"most":[7],"interesting":[8],"and":[9,23,41,97,160,162,178],"attractive":[10],"clips":[11],"from":[12,108,147],"lengthy":[13],"videos,":[14],"which":[15],"is":[16],"crucial":[17],"for":[18,102],"enhancing":[19],"video":[21,31,51,79,181],"editing":[22],"viewing":[24],"experience":[25],"on":[26,37,135,154],"social":[27],"media":[28],"platforms.":[29],"Existing":[30],"methods":[34],"predominantly":[35],"rely":[36],"visual":[38,96],"modality":[39],"information,":[40],"underutilize":[42],"abundant":[44],"multimodality":[45],"of":[46,93,105,132,170,180],"videos.":[47],"Furthermore,":[48],"in":[49,166],"supervised":[50],"analysis":[52],"tasks,":[53],"subjective":[54],"judgments":[55],"during":[56],"label":[57],"annotation":[58],"can":[59],"generate":[60],"uncertain":[61],"noise":[62,123,133,171],"labels":[63],"that":[64,117,140],"negatively":[65],"impact":[66,131,169],"learning":[68,137],"process.":[69],"To":[70],"address":[71],"these":[72],"issues,":[73],"we":[74],"propose":[75],"a":[76,94,114],"noise-robust":[77],"multimodal":[78,91],"approach.":[82],"Our":[83],"approach":[84,153],"first":[85],"enhances":[86],"feature":[87],"representation":[88],"by":[89],"incorporating":[90],"representations":[92],"video\u2019s":[95],"auditory":[98],"information.":[99],"This":[100,125],"allows":[101],"extraction":[104],"complementary":[106],"information":[107],"different":[109],"modalities.":[110],"We":[111,150],"then":[112],"implement":[113],"noise-cleaning":[115],"mechanism":[116],"utilizes":[118],"multiple":[119],"modalities":[120],"clean":[122,148],"samples.":[124,149],"helps":[126],"suppress":[128],"negative":[130],"samples":[134],"process,":[138],"ensuring":[139],"network":[142],"learns":[143],"more":[144],"robust":[145],"features":[146],"evaluate":[151],"our":[152],"two":[155],"public":[156],"datasets,":[157],"YouTube":[158],"Highlights":[159],"TVSum,":[161],"demonstrate":[163],"its":[164],"efficacy":[165],"mitigating":[167],"labels,":[172],"while":[173],"also":[174],"improving":[175],"accuracy":[177],"robustness":[179],"detection.":[183]},"counts_by_year":[],"updated_date":"2025-12-21T01:58:51.020947","created_date":"2025-10-10T00:00:00"}
