{"id":"https://openalex.org/W3180895563","doi":"https://doi.org/10.1162/tacl_a_00389","title":"Self-supervised Regularization for Text Classification","display_name":"Self-supervised Regularization for Text Classification","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3180895563","doi":"https://doi.org/10.1162/tacl_a_00389","mag":"3180895563"},"language":"en","primary_location":{"id":"doi:10.1162/tacl_a_00389","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00389","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00389/1930826/tacl_a_00389.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00389/1930826/tacl_a_00389.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006219919","display_name":"Meng Zhou","orcid":"https://orcid.org/0000-0001-6485-8995"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Meng Zhou","raw_affiliation_strings":["Shanghai Jiao Tong University, China. zhoumeng9904@sjtu.edu.cn"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, China. zhoumeng9904@sjtu.edu.cn","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020605281","display_name":"Zechen Li","orcid":null},"institutions":[{"id":"https://openalex.org/I12912129","display_name":"Northeastern University","ror":"https://ror.org/04t5xt781","country_code":"US","type":"education","lineage":["https://openalex.org/I12912129"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Zechen Li","raw_affiliation_strings":["Northeastern University, United States. li.zec@northeastern.edu"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Northeastern University, United States. li.zec@northeastern.edu","institution_ids":["https://openalex.org/I12912129"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5083884675","display_name":"Pengtao Xie","orcid":"https://orcid.org/0000-0003-0521-174X"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Pengtao Xie","raw_affiliation_strings":["UC San Diego, United States. p1xie@eng.ucsd.edu"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"UC San Diego, United States. p1xie@eng.ucsd.edu","institution_ids":["https://openalex.org/I36258959"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5006219919","https://openalex.org/A5020605281","https://openalex.org/A5083884675"],"corresponding_institution_ids":["https://openalex.org/I12912129","https://openalex.org/I183067930","https://openalex.org/I36258959"],"apc_list":null,"apc_paid":null,"fwci":0.9794,"has_fulltext":true,"cited_by_count":12,"citation_normalized_percentile":{"value":0.80613315,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"9","issue":null,"first_page":"641","last_page":"656"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.9084482192993164},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8619515895843506},{"id":"https://openalex.org/keywords/regularization","display_name":"Regularization (linguistics)","score":0.7251250743865967},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6821691989898682},{"id":"https://openalex.org/keywords/labeled-data","display_name":"Labeled data","score":0.6488999128341675},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6034013628959656},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5796502232551575},{"id":"https://openalex.org/keywords/semi-supervised-learning","display_name":"Semi-supervised learning","score":0.5061931014060974},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.4519228935241699},{"id":"https://openalex.org/keywords/supervised-learning","display_name":"Supervised learning","score":0.41560399532318115},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4109148681163788},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.39378952980041504},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3402770757675171},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.14772331714630127}],"concepts":[{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.9084482192993164},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8619515895843506},{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.7251250743865967},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6821691989898682},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.6488999128341675},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6034013628959656},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5796502232551575},{"id":"https://openalex.org/C58973888","wikidata":"https://www.wikidata.org/wiki/Q1041418","display_name":"Semi-supervised learning","level":2,"score":0.5061931014060974},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.4519228935241699},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.41560399532318115},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4109148681163788},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.39378952980041504},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3402770757675171},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.14772331714630127},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1162/tacl_a_00389","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00389","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00389/1930826/tacl_a_00389.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:1f14ed4fa4164639b9c781fae7d0910b","is_oa":false,"landing_page_url":"https://doaj.org/article/1f14ed4fa4164639b9c781fae7d0910b","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Transactions of the Association for Computational Linguistics, Vol 9, Pp 641-656 (2021)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1162/tacl_a_00389","is_oa":true,"landing_page_url":"https://doi.org/10.1162/tacl_a_00389","pdf_url":"https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl_a_00389/1930826/tacl_a_00389.pdf","source":{"id":"https://openalex.org/S2729999759","display_name":"Transactions of the Association for Computational Linguistics","issn_l":"2307-387X","issn":["2307-387X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Transactions of the Association for Computational Linguistics","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.5899999737739563}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3180895563.pdf","grobid_xml":"https://content.openalex.org/works/W3180895563.grobid-xml"},"referenced_works_count":104,"referenced_works":["https://openalex.org/W1924770834","https://openalex.org/W2027731328","https://openalex.org/W2053186076","https://openalex.org/W2064675550","https://openalex.org/W2064794832","https://openalex.org/W2081580037","https://openalex.org/W2113459411","https://openalex.org/W2120615054","https://openalex.org/W2130942839","https://openalex.org/W2194775991","https://openalex.org/W2265846598","https://openalex.org/W2279376656","https://openalex.org/W2284289336","https://openalex.org/W2326925005","https://openalex.org/W2407776548","https://openalex.org/W2559655401","https://openalex.org/W2582630951","https://openalex.org/W2612690371","https://openalex.org/W2741271950","https://openalex.org/W2768282280","https://openalex.org/W2769857323","https://openalex.org/W2785325870","https://openalex.org/W2798991696","https://openalex.org/W2808556605","https://openalex.org/W2842511635","https://openalex.org/W2896457183","https://openalex.org/W2923014074","https://openalex.org/W2955041501","https://openalex.org/W2963012544","https://openalex.org/W2963026768","https://openalex.org/W2963103975","https://openalex.org/W2963341956","https://openalex.org/W2963403868","https://openalex.org/W2963420272","https://openalex.org/W2963639288","https://openalex.org/W2963718112","https://openalex.org/W2964700958","https://openalex.org/W2964935470","https://openalex.org/W2965373594","https://openalex.org/W2970235454","https://openalex.org/W2970597249","https://openalex.org/W2971155163","https://openalex.org/W2971296908","https://openalex.org/W2982399380","https://openalex.org/W2990138404","https://openalex.org/W2992922049","https://openalex.org/W2996428491","https://openalex.org/W2997200074","https://openalex.org/W2998186887","https://openalex.org/W3005680577","https://openalex.org/W3015777882","https://openalex.org/W3017243633","https://openalex.org/W3026732421","https://openalex.org/W3034238904","https://openalex.org/W3034985160","https://openalex.org/W3034999214","https://openalex.org/W3035524453","https://openalex.org/W3036170826","https://openalex.org/W3082274269","https://openalex.org/W3086452730","https://openalex.org/W3093937711","https://openalex.org/W3100345210","https://openalex.org/W3115293622","https://openalex.org/W3117088788","https://openalex.org/W3156333129","https://openalex.org/W3173679616","https://openalex.org/W4236965008","https://openalex.org/W4245267204","https://openalex.org/W4247780151","https://openalex.org/W4256229248","https://openalex.org/W4285618474","https://openalex.org/W4287812705","https://openalex.org/W4288089799","https://openalex.org/W4297808394","https://openalex.org/W6640212811","https://openalex.org/W6675802400","https://openalex.org/W6676984168","https://openalex.org/W6679436768","https://openalex.org/W6685053522","https://openalex.org/W6687483927","https://openalex.org/W6695662000","https://openalex.org/W6713582272","https://openalex.org/W6739901393","https://openalex.org/W6746052068","https://openalex.org/W6747899497","https://openalex.org/W6755207826","https://openalex.org/W6763416564","https://openalex.org/W6763701032","https://openalex.org/W6766673545","https://openalex.org/W6767026726","https://openalex.org/W6768021236","https://openalex.org/W6769311223","https://openalex.org/W6769627184","https://openalex.org/W6770717842","https://openalex.org/W6774314701","https://openalex.org/W6775563663","https://openalex.org/W6775634482","https://openalex.org/W6776523511","https://openalex.org/W6776700526","https://openalex.org/W6780178746","https://openalex.org/W6780226713","https://openalex.org/W6783023299","https://openalex.org/W6784910178","https://openalex.org/W6844194202"],"related_works":["https://openalex.org/W2989610201","https://openalex.org/W2131513867","https://openalex.org/W2133556223","https://openalex.org/W4306904961","https://openalex.org/W4318825627","https://openalex.org/W2752124967","https://openalex.org/W2184099506","https://openalex.org/W4287278258","https://openalex.org/W3134858141","https://openalex.org/W3180895563"],"abstract_inverted_index":{"Abstract":[0],"Text":[1],"classification":[2,22,84,135,141],"is":[3,24,54,97,100,151],"a":[4,40,82,113,127],"widely":[5],"studied":[6],"problem":[7],"and":[8,71,86],"has":[9],"broad":[10],"applications.":[11],"In":[12,80],"many":[13],"real-world":[14],"problems,":[15],"the":[16,121,134,144],"number":[17,129],"of":[18,130,146],"texts":[19,105],"for":[20],"training":[21],"models":[23,29],"limited,":[25],"which":[26,99],"renders":[27],"these":[28,77],"prone":[30],"to":[31,126],"overfitting.":[32],"To":[33],"address":[34],"this":[35],"problem,":[36],"we":[37],"propose":[38],"SSL-Reg,":[39,81],"data-dependent":[41],"regularization":[42],"approach":[43,58],"based":[44],"on":[45,63,103,138],"self-supervised":[46],"learning":[47,57],"(SSL).":[48],"SSL":[49,89,95,117],"(Devlin":[50],"et":[51],"al.,":[52],"2019a)":[53],"an":[55,87,116],"unsupervised":[56,88],"that":[59],"defines":[60],"auxiliary":[61,78],"tasks":[62],"input":[64,104],"data":[65,73],"without":[66,106],"using":[67,107,115],"any":[68,108],"human-provided":[69],"labels":[70,132],"learns":[72],"representations":[74],"by":[75],"solving":[76],"tasks.":[79],"supervised":[83],"task":[85,90,96,118],"are":[91],"performed":[92],"simultaneously.":[93],"The":[94],"unsupervised,":[98],"defined":[101],"purely":[102],"human-":[109],"provided":[110],"labels.":[111],"Training":[112],"model":[114,122],"can":[119],"prevent":[120],"from":[123],"being":[124],"overfitted":[125],"limited":[128],"class":[131],"in":[133],"task.":[136],"Experiments":[137],"17":[139],"text":[140],"datasets":[142],"demonstrate":[143],"effectiveness":[145],"our":[147],"proposed":[148],"method.":[149],"Code":[150],"available":[152],"at":[153],"https://github.com/UCSD-AI4H/SSReg.":[154]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":4},{"year":2021,"cited_by_count":1}],"updated_date":"2026-05-21T09:19:25.381259","created_date":"2025-10-10T00:00:00"}
