{"id":"https://openalex.org/W4387969327","doi":"https://doi.org/10.1145/3581783.3612526","title":"Training Multimedia Event Extraction With Generated Images and Captions","display_name":"Training Multimedia Event Extraction With Generated Images and Captions","publication_year":2023,"publication_date":"2023-10-26","ids":{"openalex":"https://openalex.org/W4387969327","doi":"https://doi.org/10.1145/3581783.3612526"},"language":"en","primary_location":{"id":"doi:10.1145/3581783.3612526","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3581783.3612526","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3581783.3612526","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3581783.3612526","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049430074","display_name":"Zilin Du","orcid":"https://orcid.org/0000-0003-3534-9547"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Zilin Du","raw_affiliation_strings":["Nanyang Technological University, Singapore, Singapore"],"raw_orcid":"https://orcid.org/0000-0003-3534-9547","affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019703861","display_name":"Yunxin Li","orcid":"https://orcid.org/0000-0003-4819-2489"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yunxin Li","raw_affiliation_strings":["Harbin Institute of Technology, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0003-4819-2489","affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021507977","display_name":"Xu Guo","orcid":"https://orcid.org/0000-0003-1034-9508"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Xu Guo","raw_affiliation_strings":["Nanyang Technological University, Singapore, Singapore"],"raw_orcid":"https://orcid.org/0000-0003-1034-9508","affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103010040","display_name":"Yidan Sun","orcid":"https://orcid.org/0000-0002-7897-3035"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Yidan Sun","raw_affiliation_strings":["Nanyang Technological University, Singapore, Singapore"],"raw_orcid":"https://orcid.org/0000-0002-7897-3035","affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100732746","display_name":"Boyang Li","orcid":"https://orcid.org/0000-0002-6230-2376"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Boyang Li","raw_affiliation_strings":["Nanyang Technological University, Singapore, Singapore"],"raw_orcid":"https://orcid.org/0000-0002-6230-2376","affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.6737,"has_fulltext":true,"cited_by_count":6,"citation_normalized_percentile":{"value":0.71912338,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"5504","last_page":"5513"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8257439136505127},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7274801731109619},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.7021334767341614},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.5838258862495422},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.5772752165794373},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.5285162925720215},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.503879725933075},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4903299808502197},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.470638245344162},{"id":"https://openalex.org/keywords/synthetic-data","display_name":"Synthetic data","score":0.4380591809749603},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4233127534389496},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.42278599739074707},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.41907137632369995},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4097784161567688},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.12602290511131287}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8257439136505127},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7274801731109619},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.7021334767341614},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.5838258862495422},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.5772752165794373},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.5285162925720215},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.503879725933075},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4903299808502197},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.470638245344162},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.4380591809749603},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4233127534389496},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.42278599739074707},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.41907137632369995},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4097784161567688},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.12602290511131287},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3581783.3612526","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3581783.3612526","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3581783.3612526","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3581783.3612526","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3581783.3612526","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3581783.3612526","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Multimedia","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6597490799","display_name":null,"funder_award_id":"NRF-NRFF13-2021-0006","funder_id":"https://openalex.org/F4320320671","funder_display_name":"National Research Foundation"}],"funders":[{"id":"https://openalex.org/F4320320671","display_name":"National Research Foundation","ror":"https://ror.org/05s0g1g46"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4387969327.pdf","grobid_xml":"https://content.openalex.org/works/W4387969327.grobid-xml"},"referenced_works_count":42,"referenced_works":["https://openalex.org/W2063464767","https://openalex.org/W2251199578","https://openalex.org/W2423576022","https://openalex.org/W2560747010","https://openalex.org/W2604673901","https://openalex.org/W2604783118","https://openalex.org/W2753738274","https://openalex.org/W2766863698","https://openalex.org/W2891553865","https://openalex.org/W2930957955","https://openalex.org/W2997585029","https://openalex.org/W2999905431","https://openalex.org/W3011727199","https://openalex.org/W3034184697","https://openalex.org/W3035333188","https://openalex.org/W3096682293","https://openalex.org/W3098383912","https://openalex.org/W3154063293","https://openalex.org/W3168620925","https://openalex.org/W3168900788","https://openalex.org/W3169436550","https://openalex.org/W3174691968","https://openalex.org/W3176032431","https://openalex.org/W3176453404","https://openalex.org/W3176951816","https://openalex.org/W3181951703","https://openalex.org/W3207166518","https://openalex.org/W4200630531","https://openalex.org/W4205157616","https://openalex.org/W4221159406","https://openalex.org/W4224903949","https://openalex.org/W4281485151","https://openalex.org/W4287019595","https://openalex.org/W4292433237","https://openalex.org/W4304086159","https://openalex.org/W4312407537","https://openalex.org/W4312900708","https://openalex.org/W4312933868","https://openalex.org/W4385572711","https://openalex.org/W6600175266","https://openalex.org/W6600339963","https://openalex.org/W6679942958"],"related_works":["https://openalex.org/W73545470","https://openalex.org/W4224266612","https://openalex.org/W2383394264","https://openalex.org/W4320153225","https://openalex.org/W4293261942","https://openalex.org/W3125968744","https://openalex.org/W203959209","https://openalex.org/W2167701463","https://openalex.org/W2110287964","https://openalex.org/W4307407935"],"abstract_inverted_index":{"Contemporary":[0],"news":[1],"reporting":[2],"increasingly":[3],"features":[4,98],"multimedia":[5,10,126],"content,":[6],"motivating":[7],"research":[8],"on":[9,59,88,121,138,146],"event":[11,139],"extraction.":[12],"However,":[13],"the":[14,28,32,86,89,122,132,157,167],"task":[15],"lacks":[16],"annotated":[17],"multimodal":[18,51,65,91],"training":[19,24,52,61,66,110,171],"data":[20,25,53,67,172],"and":[21,54,76,108,142],"artificially":[22,49],"generated":[23,50],"suffer":[26],"from":[27,31,156],"distribution":[29],"shift":[30],"real-world":[33],"data.":[34],"In":[35,93],"this":[36],"paper,":[37],"we":[38,63,84,104,130],"propose":[39],"Cross-modality":[40],"Augmented":[41],"Multimedia":[42],"Event":[43],"Learning":[44],"(CAMEL),":[45],"which":[46,149],"successfully":[47],"utilizes":[48],"achieves":[55],"state-of-the-art":[56,118],"performance.":[57],"Conditioned":[58],"unimodal":[60],"data,":[62],"generate":[64],"using":[68],"off-the-shelf":[69],"image":[70,77],"generators":[71],"like":[72,79],"Stable":[73],"Diffusion":[74],"[45]":[75],"captioners":[78],"BLIP":[80],"[24].":[81],"After":[82],"that,":[83],"train":[85],"network":[87],"resultant":[90],"datasets.":[92],"order":[94],"to":[95,165],"learn":[96],"robust":[97],"that":[99,115,151],"are":[100],"effective":[101],"across":[102],"domains,":[103],"devise":[105],"an":[106],"iterative":[107],"gradual":[109],"strategy.":[111],"Substantial":[112],"experiments":[113],"show":[114],"CAMEL":[116,152],"surpasses":[117],"(SOTA)":[119],"baselines":[120],"M2E2":[123],"benchmark.":[124],"On":[125],"events":[127],"in":[128,173],"particular,":[129],"outperform":[131],"prior":[133],"SOTA":[134],"by":[135,143],"4.2%":[136],"F1":[137,145],"mention":[140],"identification":[141],"9.8%":[144],"argument":[147],"identification,":[148],"demonstrates":[150,162],"learns":[153],"synergistic":[154],"representations":[155],"two":[158],"modalities.":[159],"Our":[160],"work":[161],"a":[163],"recipe":[164],"unleash":[166],"power":[168],"of":[169],"synthetic":[170],"structured":[174],"prediction.":[175]},"counts_by_year":[{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
