{"id":"https://openalex.org/W4408324883","doi":"https://doi.org/10.1109/icassp49660.2025.10890433","title":"Adaptive Contribution Modulation For Multi-Modal Manipulation Media Detection and Grounding","display_name":"Adaptive Contribution Modulation For Multi-Modal Manipulation Media Detection and Grounding","publication_year":2025,"publication_date":"2025-03-11","ids":{"openalex":"https://openalex.org/W4408324883","doi":"https://doi.org/10.1109/icassp49660.2025.10890433"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49660.2025.10890433","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890433","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Yixiang Li","orcid":null},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yixiang Li","raw_affiliation_strings":["School of Computer Science and Engineering, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"last","author":{"id":null,"display_name":"Biao Leng","orcid":null},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Biao Leng","raw_affiliation_strings":["School of Computer Science and Engineering, Beihang University,Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Beihang University,Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I82880672"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.08723022,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12667","display_name":"Economic and Technological Developments in Russia","score":0.1890999972820282,"subfield":{"id":"https://openalex.org/subfields/3303","display_name":"Development"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12667","display_name":"Economic and Technological Developments in Russia","score":0.1890999972820282,"subfield":{"id":"https://openalex.org/subfields/3303","display_name":"Development"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T14470","display_name":"Advanced Data Processing Techniques","score":0.1762000024318695,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/circuit-breaker","display_name":"Circuit breaker","score":0.8080161809921265},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5256206393241882},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.2640858292579651},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.22865334153175354}],"concepts":[{"id":"https://openalex.org/C61352017","wikidata":"https://www.wikidata.org/wiki/Q211058","display_name":"Circuit breaker","level":2,"score":0.8080161809921265},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5256206393241882},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.2640858292579651},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.22865334153175354}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49660.2025.10890433","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890433","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W2962858109","https://openalex.org/W2963416784","https://openalex.org/W2982058372","https://openalex.org/W3034795015","https://openalex.org/W3034900344","https://openalex.org/W3174508664","https://openalex.org/W3174814557","https://openalex.org/W4214691743","https://openalex.org/W4280579728","https://openalex.org/W4360884927","https://openalex.org/W4385805162","https://openalex.org/W4385815563","https://openalex.org/W4386071472","https://openalex.org/W4386076652","https://openalex.org/W4386590781","https://openalex.org/W4386928847","https://openalex.org/W4389520128","https://openalex.org/W4390190315","https://openalex.org/W4390873235","https://openalex.org/W4391952560","https://openalex.org/W4392903163","https://openalex.org/W4392909607","https://openalex.org/W4402716164","https://openalex.org/W4402915519","https://openalex.org/W6763240421","https://openalex.org/W6767924615","https://openalex.org/W6788722341","https://openalex.org/W6853543659"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2186957643","https://openalex.org/W4313289174","https://openalex.org/W2169296235","https://openalex.org/W2383147444","https://openalex.org/W2772771794","https://openalex.org/W2370462073","https://openalex.org/W2351129194"],"abstract_inverted_index":{"In":[0],"response":[1],"to":[2,56,79,154],"the":[3,8,58,66,102,131,141,146],"security":[4],"risks":[5],"posed":[6],"by":[7],"realistic":[9],"propagation":[10],"of":[11,60,104,130,134,149],"manipulated":[12],"media":[13,19],"data,":[14],"detecting":[15],"and":[16,68,90,117],"grounding":[17],"multi-modal":[18,31,61,122],"manipulation":[20],"has":[21],"received":[22],"attention":[23],"as":[24],"a":[25],"challenging":[26],"task.":[27],"However,":[28],"there":[29],"is":[30],"contribution":[32,62,96,120,123],"imbalance":[33],"on":[34,110,140],"current":[35],"approach":[36,151],"for":[37,83,107],"cross-modal":[38,111],"learning,":[39,113,125],"which":[40,86,99,126,144],"affects":[41],"model":[42],"performance":[43,148],"optimisation.":[44],"To":[45,64],"this":[46],"end,":[47],"we":[48,74,94,114],"propose":[49,75,95],"an":[50],"Adaptive":[51],"Contribution":[52],"Modulation":[53],"(ACM)":[54],"framework":[55],"solve":[57],"problem":[59],"imbalance.":[63],"balance":[65,115],"image":[67,116],"text":[69,118],"embedding":[70],"features":[71],"before":[72],"fusion,":[73],"adaptive":[76,89],"weight":[77],"decision":[78],"computes":[80],"dynamic":[81],"weights":[82],"fusion":[84],"features,":[85],"enable":[87],"more":[88],"robust":[91],"decision-making.":[92],"Meanwhile,":[93],"modulation":[97],"block,":[98],"dynamically":[100],"governs":[101],"contributions":[103],"different":[105],"modalities":[106],"optimization.":[108],"Based":[109],"contrastive":[112],"embeddings":[119],"through":[121,152],"balanced":[124],"makes":[127],"better":[128],"use":[129],"semantic":[132],"correlation":[133],"all":[135],"modalities.":[136],"We":[137],"conduct":[138],"experiments":[139],"DGM4":[142],"dataset,":[143],"demonstrate":[145],"superior":[147],"our":[150],"compared":[153],"state-of-the-art":[155],"methods.":[156]},"counts_by_year":[],"updated_date":"2025-12-28T23:10:05.387466","created_date":"2025-03-12T00:00:00"}
