{"id":"https://openalex.org/W4416922359","doi":"https://doi.org/10.1109/taffc.2025.3639406","title":"AMuSeD: An Attentive Deep Neural Network for Multimodal Sarcasm Detection Incorporating Bimodal Data Augmentation","display_name":"AMuSeD: An Attentive Deep Neural Network for Multimodal Sarcasm Detection Incorporating Bimodal Data Augmentation","publication_year":2025,"publication_date":"2025-12-02","ids":{"openalex":"https://openalex.org/W4416922359","doi":"https://doi.org/10.1109/taffc.2025.3639406"},"language":"en","primary_location":{"id":"doi:10.1109/taffc.2025.3639406","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taffc.2025.3639406","pdf_url":null,"source":{"id":"https://openalex.org/S104780363","display_name":"IEEE Transactions on Affective Computing","issn_l":"1949-3045","issn":["1949-3045","2371-9850"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Affective Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101560145","display_name":"Xiyuan Gao","orcid":"https://orcid.org/0000-0003-0870-6721"},"institutions":[{"id":"https://openalex.org/I196758499","display_name":"Fryske Akademy","ror":"https://ror.org/05fcmfe52","country_code":"NL","type":"facility","lineage":["https://openalex.org/I196758499"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Xiyuan Gao","raw_affiliation_strings":["Campus Frysl&#x00E2;n, University of Groningen, Leeuwarden, The Netherlands"],"raw_orcid":"https://orcid.org/0000-0003-0870-6721","affiliations":[{"raw_affiliation_string":"Campus Frysl&#x00E2;n, University of Groningen, Leeuwarden, The Netherlands","institution_ids":["https://openalex.org/I196758499"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076096927","display_name":"Shubhi Bansal","orcid":"https://orcid.org/0000-0002-8034-8220"},"institutions":[{"id":"https://openalex.org/I64295750","display_name":"Indian Institute of Technology Indore","ror":"https://ror.org/01hhf7w52","country_code":"IN","type":"education","lineage":["https://openalex.org/I64295750"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Shubhi Bansal","raw_affiliation_strings":["Computer Science and Engineering, Indian Institute of Technology Indore, Indore, India"],"raw_orcid":"https://orcid.org/0000-0002-8034-8220","affiliations":[{"raw_affiliation_string":"Computer Science and Engineering, Indian Institute of Technology Indore, Indore, India","institution_ids":["https://openalex.org/I64295750"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055897461","display_name":"Kushaan Gowda","orcid":"https://orcid.org/0000-0001-6921-2069"},"institutions":[{"id":"https://openalex.org/I64295750","display_name":"Indian Institute of Technology Indore","ror":"https://ror.org/01hhf7w52","country_code":"IN","type":"education","lineage":["https://openalex.org/I64295750"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Kushaan Gowda","raw_affiliation_strings":["Computer Science and Engineering, Indian Institute of Technology Indore, Indore, India"],"raw_orcid":"https://orcid.org/0000-0001-6921-2069","affiliations":[{"raw_affiliation_string":"Computer Science and Engineering, Indian Institute of Technology Indore, Indore, India","institution_ids":["https://openalex.org/I64295750"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zhu Li","orcid":"https://orcid.org/0000-0002-1409-2482"},"institutions":[{"id":"https://openalex.org/I196758499","display_name":"Fryske Akademy","ror":"https://ror.org/05fcmfe52","country_code":"NL","type":"facility","lineage":["https://openalex.org/I196758499"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Zhu Li","raw_affiliation_strings":["Campus Frysl&#x00E2;n, University of Groningen, Leeuwarden, The Netherlands"],"raw_orcid":"https://orcid.org/0000-0002-1409-2482","affiliations":[{"raw_affiliation_string":"Campus Frysl&#x00E2;n, University of Groningen, Leeuwarden, The Netherlands","institution_ids":["https://openalex.org/I196758499"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001110193","display_name":"Shekhar Nayak","orcid":"https://orcid.org/0000-0002-4277-4851"},"institutions":[{"id":"https://openalex.org/I196758499","display_name":"Fryske Akademy","ror":"https://ror.org/05fcmfe52","country_code":"NL","type":"facility","lineage":["https://openalex.org/I196758499"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Shekhar Nayak","raw_affiliation_strings":["Campus Frysl&#x00E2;n, University of Groningen, Leeuwarden, The Netherlands"],"raw_orcid":"https://orcid.org/0000-0002-4277-4851","affiliations":[{"raw_affiliation_string":"Campus Frysl&#x00E2;n, University of Groningen, Leeuwarden, The Netherlands","institution_ids":["https://openalex.org/I196758499"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009822257","display_name":"Nagendra Kumar","orcid":"https://orcid.org/0000-0003-4644-3168"},"institutions":[{"id":"https://openalex.org/I64295750","display_name":"Indian Institute of Technology Indore","ror":"https://ror.org/01hhf7w52","country_code":"IN","type":"education","lineage":["https://openalex.org/I64295750"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Nagendra Kumar","raw_affiliation_strings":["Computer Science and Engineering, Indian Institute of Technology Indore, Indore, India"],"raw_orcid":"https://orcid.org/0000-0003-4644-3168","affiliations":[{"raw_affiliation_string":"Computer Science and Engineering, Indian Institute of Technology Indore, Indore, India","institution_ids":["https://openalex.org/I64295750"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5090819693","display_name":"Matt Coler","orcid":"https://orcid.org/0000-0002-7631-5063"},"institutions":[{"id":"https://openalex.org/I196758499","display_name":"Fryske Akademy","ror":"https://ror.org/05fcmfe52","country_code":"NL","type":"facility","lineage":["https://openalex.org/I196758499"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Matt Coler","raw_affiliation_strings":["Campus Frysl&#x00E2;n, University of Groningen, Leeuwarden, The Netherlands"],"raw_orcid":"https://orcid.org/0000-0002-7631-5063","affiliations":[{"raw_affiliation_string":"Campus Frysl&#x00E2;n, University of Groningen, Leeuwarden, The Netherlands","institution_ids":["https://openalex.org/I196758499"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5101560145"],"corresponding_institution_ids":["https://openalex.org/I196758499"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.19382849,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"17","issue":"1","first_page":"900","last_page":"912"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.5996000170707703,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.5996000170707703,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.11599999666213989,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11148","display_name":"Language, Metaphor, and Cognition","score":0.02419999986886978,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sarcasm","display_name":"Sarcasm","score":0.9843999743461609},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.49959999322891235},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4666999876499176},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.46129998564720154},{"id":"https://openalex.org/keywords/scarcity","display_name":"Scarcity","score":0.3788999915122986},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.37059998512268066}],"concepts":[{"id":"https://openalex.org/C2776207355","wikidata":"https://www.wikidata.org/wiki/Q191035","display_name":"Sarcasm","level":3,"score":0.9843999743461609},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.684499979019165},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6710000038146973},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.49959999322891235},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4666999876499176},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.46129998564720154},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.42719998955726624},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4171000123023987},{"id":"https://openalex.org/C109747225","wikidata":"https://www.wikidata.org/wiki/Q815758","display_name":"Scarcity","level":2,"score":0.3788999915122986},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.37059998512268066},{"id":"https://openalex.org/C6438553","wikidata":"https://www.wikidata.org/wiki/Q1185804","display_name":"Affective computing","level":2,"score":0.3596999943256378},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3255999982357025},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.2939000129699707},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.29109999537467957},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.28459998965263367},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.2508000135421753}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/taffc.2025.3639406","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taffc.2025.3639406","pdf_url":null,"source":{"id":"https://openalex.org/S104780363","display_name":"IEEE Transactions on Affective Computing","issn_l":"1949-3045","issn":["1949-3045","2371-9850"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Affective Computing","raw_type":"journal-article"},{"id":"pmh:oai:pure.rug.nl:openaire_cris_publications/d749283e-0823-46db-a15c-45099abef46a","is_oa":false,"landing_page_url":"https://research.rug.nl/en/publications/d749283e-0823-46db-a15c-45099abef46a","pdf_url":null,"source":{"id":"https://openalex.org/S4306400420","display_name":"University of Groningen research database (University of Groningen / Centre for Information Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I169381384","host_organization_name":"University of Groningen","host_organization_lineage":["https://openalex.org/I169381384"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Gao, X, Bansal, S, Gowda, K, Li, Z, Nayak, S, Kumar, N & Coler, M 2026, 'AMuSeD : An Attentive Deep Neural Network for Multimodal Sarcasm Detection Incorporating Bi-modal Data Augmentation', IEEE Transactions on Affective Computing, vol. 17, no. 1, pp. 900-912. https://doi.org/10.1109/TAFFC.2025.3639406","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:pure.rug.nl:publications/d749283e-0823-46db-a15c-45099abef46a","is_oa":false,"landing_page_url":"https://hdl.handle.net/11370/d749283e-0823-46db-a15c-45099abef46a","pdf_url":null,"source":{"id":"https://openalex.org/S4306400420","display_name":"University of Groningen research database (University of Groningen / Centre for Information Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I169381384","host_organization_name":"University of Groningen","host_organization_lineage":["https://openalex.org/I169381384"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Gao, X, Bansal, S, Gowda, K, Li, Z, Nayak, S, Kumar, N & Coler, M 2026, 'AMuSeD : An Attentive Deep Neural Network for Multimodal Sarcasm Detection Incorporating Bi-modal Data Augmentation', IEEE Transactions on Affective Computing, vol. 17, no. 1, pp. 900-912. https://doi.org/10.1109/TAFFC.2025.3639406","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Detecting":[0],"sarcasm":[1,22,97],"effectively":[2],"requires":[3],"a":[4,62,89,103,145],"nuanced":[5],"understanding":[6],"of":[7,31,88,148],"context,":[8],"including":[9],"vocal":[10],"tones":[11],"and":[12,60],"facial":[13],"expressions.":[14],"The":[15,68,82],"progression":[16],"towards":[17],"multimodal":[18],"computational":[19],"methods":[20],"in":[21,150],"detection,":[23],"however,":[24],"faces":[25],"challenges":[26],"due":[27],"to":[28,98,132],"the":[29,54,86,116,134,141,161],"scarcity":[30],"data.":[32],"To":[33],"address":[34],"this,":[35],"we":[36],"present":[37],"AMuSeD":[38],"(Attentive":[39],"deep":[40],"neural":[41],"network":[42],"for":[43,96,115,125],"MUltimodal":[44],"Sarcasm":[45,56],"dEtection":[46],"incorporating":[47],"bi-modal":[48],"Data":[49],"augmentation).":[50],"This":[51],"approach":[52,143],"utilizes":[53],"Multimodal":[55],"Detection":[57],"Dataset":[58],"(MUStARD)":[59],"introduces":[61],"two-phase":[63],"bimodal":[64],"data":[65],"augmentation":[66],"strategy.":[67],"first":[69],"phase":[70,84],"involves":[71,85],"generating":[72],"varied":[73],"text":[74,117],"samples":[75],"through":[76],"Back-Translation":[77],"from":[78,160],"several":[79],"secondary":[80],"languages.":[81],"second":[83],"refinement":[87],"FastSpeech2-based":[90],"speech":[91],"synthesis":[92],"system,":[93],"tailored":[94],"specifically":[95],"retain":[99],"sarcastic":[100],"intonations.":[101],"Alongside":[102],"cloud-based":[104],"Text-to-Speech":[105],"(TTS)":[106],"service,":[107],"this":[108],"Fine-tuned":[109],"FastSpeech2":[110],"system":[111],"produces":[112],"corresponding":[113],"audio":[114],"augmentations.":[118],"We":[119],"also":[120],"evaluate":[121],"various":[122],"attention":[123],"mechanisms":[124],"selectively":[126],"enhancing":[127],"sarcasm-relevant":[128],"features,":[129],"finding":[130],"self-attention":[131],"be":[133],"most":[135],"efficient.":[136],"Our":[137],"experiments":[138],"reveal":[139],"that":[140,156],"proposed":[142],"achieves":[144],"significant":[146],"F1-score":[147],"81.0%":[149],"text-audio":[151],"modalities,":[152],"surpassing":[153],"even":[154],"models":[155],"use":[157],"three":[158],"modalities":[159],"MUStARD":[162],"dataset.":[163]},"counts_by_year":[],"updated_date":"2026-03-03T06:13:14.889584","created_date":"2025-12-02T00:00:00"}
