{"id":"https://openalex.org/W4372272424","doi":"https://doi.org/10.1109/icassp49357.2023.10095209","title":"Improving the out-of-Distribution Generalization Capability of Language Models: Counterfactually-Augmented Data is not Enough","display_name":"Improving the out-of-Distribution Generalization Capability of Language Models: Counterfactually-Augmented Data is not Enough","publication_year":2023,"publication_date":"2023-05-05","ids":{"openalex":"https://openalex.org/W4372272424","doi":"https://doi.org/10.1109/icassp49357.2023.10095209"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49357.2023.10095209","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10095209","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006419976","display_name":"Caoyun Fan","orcid":"https://orcid.org/0000-0001-7360-3468"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Caoyun Fan","raw_affiliation_strings":["Shanghai Jiao Tong University,MoE Key Lab of Artificial Intelligence, AI Institute,China","MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,MoE Key Lab of Artificial Intelligence, AI Institute,China","institution_ids":["https://openalex.org/I183067930"]},{"raw_affiliation_string":"MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100628705","display_name":"Wenqing Chen","orcid":"https://orcid.org/0000-0002-8739-2216"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenqing Chen","raw_affiliation_strings":["Sun Yat-sen University,School of Software Engineering,China","School of Software Engineering, Sun Yat-sen University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Sun Yat-sen University,School of Software Engineering,China","institution_ids":["https://openalex.org/I157773358"]},{"raw_affiliation_string":"School of Software Engineering, Sun Yat-sen University, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110766031","display_name":"Jidong Tian","orcid":null},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jidong Tian","raw_affiliation_strings":["Shanghai Jiao Tong University,MoE Key Lab of Artificial Intelligence, AI Institute,China","MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,MoE Key Lab of Artificial Intelligence, AI Institute,China","institution_ids":["https://openalex.org/I183067930"]},{"raw_affiliation_string":"MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101479911","display_name":"Yitian Li","orcid":"https://orcid.org/0000-0001-9714-1368"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yitian Li","raw_affiliation_strings":["Shanghai Jiao Tong University,MoE Key Lab of Artificial Intelligence, AI Institute,China","MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,MoE Key Lab of Artificial Intelligence, AI Institute,China","institution_ids":["https://openalex.org/I183067930"]},{"raw_affiliation_string":"MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025662871","display_name":"Hao He","orcid":"https://orcid.org/0000-0002-5385-8022"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hao He","raw_affiliation_strings":["Shanghai Jiao Tong University,MoE Key Lab of Artificial Intelligence, AI Institute,China","MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,MoE Key Lab of Artificial Intelligence, AI Institute,China","institution_ids":["https://openalex.org/I183067930"]},{"raw_affiliation_string":"MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5085787425","display_name":"Yaohui Jin","orcid":"https://orcid.org/0000-0001-6158-6277"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yaohui Jin","raw_affiliation_strings":["Shanghai Jiao Tong University,MoE Key Lab of Artificial Intelligence, AI Institute,China","MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,MoE Key Lab of Artificial Intelligence, AI Institute,China","institution_ids":["https://openalex.org/I183067930"]},{"raw_affiliation_string":"MoE Key Lab of Artificial Intelligence, AI Institute, Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.8158,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.77372389,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9814000129699707,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.785772442817688},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6490457057952881},{"id":"https://openalex.org/keywords/distribution","display_name":"Distribution (mathematics)","score":0.4642779231071472},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3777152895927429},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.17774075269699097}],"concepts":[{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.785772442817688},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6490457057952881},{"id":"https://openalex.org/C110121322","wikidata":"https://www.wikidata.org/wiki/Q865811","display_name":"Distribution (mathematics)","level":2,"score":0.4642779231071472},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3777152895927429},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.17774075269699097},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49357.2023.10095209","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10095209","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.75,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W36434594","https://openalex.org/W1840435438","https://openalex.org/W2031342017","https://openalex.org/W2035174176","https://openalex.org/W2038721957","https://openalex.org/W2064675550","https://openalex.org/W2113459411","https://openalex.org/W2170240176","https://openalex.org/W2251939518","https://openalex.org/W2896457183","https://openalex.org/W2951286828","https://openalex.org/W2962893388","https://openalex.org/W2963846996","https://openalex.org/W2965373594","https://openalex.org/W2971196067","https://openalex.org/W2977235550","https://openalex.org/W3092928935","https://openalex.org/W3103651020","https://openalex.org/W3103873238","https://openalex.org/W3104169042","https://openalex.org/W3106544837","https://openalex.org/W3176197839","https://openalex.org/W3177397812","https://openalex.org/W3177575812","https://openalex.org/W3189951784","https://openalex.org/W3196850540","https://openalex.org/W3213445505","https://openalex.org/W6601502966","https://openalex.org/W6676984168","https://openalex.org/W6685053522","https://openalex.org/W6691459498","https://openalex.org/W6755207826","https://openalex.org/W6766673545","https://openalex.org/W6768299147","https://openalex.org/W6784247468","https://openalex.org/W6800440403","https://openalex.org/W7016219665"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W3162204513","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890"],"abstract_inverted_index":{"Counterfactually-Augmented":[0],"Data":[1],"(CAD)":[2],"has":[3],"the":[4,28,47,66,77,87,111,129],"potential":[5,78,139],"to":[6,19,49,97],"improve":[7,141],"language":[8,17,55,99,142],"models\u2019":[9,143],"Out-Of-Distribution":[10],"(OOD)":[11],"generalization":[12,33,113,145],"capability,":[13],"as":[14,38,40],"CAD":[15,35,80],"induces":[16],"models":[18,56,100],"exploit":[20],"causal":[21,60,72,104],"features":[22,61,105],"and":[23,68,124,128,140],"exclude":[24,69],"spurious":[25],"correlations.":[26],"However,":[27],"empirical":[29],"results":[30,131],"of":[31,79,90],"OOD":[32,112,144],"on":[34,59,86,119],"are":[36,63],"not":[37,82],"efficient":[39],"expected.":[41],"In":[42],"this":[43],"paper,":[44],"we":[45,92],"attribute":[46],"inefficiency":[48],"Myopia":[50],"Phenomenon":[51],"caused":[52],"by":[53],"CAD:":[54],"only":[57],"focus":[58],"that":[62,133],"edited":[64],"in":[65,107],"augmentation":[67],"other":[70],"non-edited":[71],"features.":[73],"As":[74],"a":[75],"result,":[76],"is":[81],"fully":[83],"exploited.":[84],"Based":[85],"structural":[88],"properties":[89],"CAD,":[91,108],"design":[93],"two":[94,120],"additional":[95],"constraints":[96],"help":[98],"extract":[101],"more":[102],"complete":[103],"contained":[106],"thus":[109],"improving":[110],"capability.":[114,146],"We":[115],"evaluate":[116],"our":[117,134],"method":[118,135],"tasks:":[121],"Sentiment":[122],"Analysis":[123],"Natural":[125],"Language":[126],"Inference,":[127],"experimental":[130],"demonstrate":[132],"could":[136],"unlock":[137],"CAD\u2019s":[138]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2023,"cited_by_count":3}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
