{"id":"https://openalex.org/W2948096105","doi":"https://doi.org/10.18653/v1/p19-1590","title":"Variational Pretraining for Semi-supervised Text Classification","display_name":"Variational Pretraining for Semi-supervised Text Classification","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2948096105","doi":"https://doi.org/10.18653/v1/p19-1590","mag":"2948096105"},"language":"en","primary_location":{"id":"doi:10.18653/v1/p19-1590","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p19-1590","pdf_url":"https://www.aclweb.org/anthology/P19-1590.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/P19-1590.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075783850","display_name":"Suchin Gururangan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210156221","display_name":"Allen Institute for Artificial Intelligence","ror":"https://ror.org/05w520734","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210156221"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Suchin Gururangan","raw_affiliation_strings":["Allen Institute for Artificial Intelligence, Seattle, WA, USA","ALLEN INSTITUTE FOR ARTIFICIAL INTELLIGENCE"],"affiliations":[{"raw_affiliation_string":"Allen Institute for Artificial Intelligence, Seattle, WA, USA","institution_ids":["https://openalex.org/I4210156221"]},{"raw_affiliation_string":"ALLEN INSTITUTE FOR ARTIFICIAL INTELLIGENCE","institution_ids":["https://openalex.org/I4210156221"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018599572","display_name":"Tam Dang","orcid":"https://orcid.org/0000-0002-3602-1917"},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tam Dang","raw_affiliation_strings":["Paul G. Allen School of Computer Science & Engineering, University of Washington, Seattle, WA, USA","University of Washington ;"],"affiliations":[{"raw_affiliation_string":"Paul G. Allen School of Computer Science & Engineering, University of Washington, Seattle, WA, USA","institution_ids":["https://openalex.org/I201448701"]},{"raw_affiliation_string":"University of Washington ;","institution_ids":["https://openalex.org/I201448701"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070767948","display_name":"Dallas Card","orcid":"https://orcid.org/0000-0001-5573-8836"},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]},{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dallas Card","raw_affiliation_strings":["Machine Learning Department, Carnegie Mellon University, Pittsburgh, PA, USA","University of Washington ;"],"affiliations":[{"raw_affiliation_string":"Machine Learning Department, Carnegie Mellon University, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"University of Washington ;","institution_ids":["https://openalex.org/I201448701"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088517824","display_name":"Noah A. Smith","orcid":"https://orcid.org/0000-0002-2310-6380"},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]},{"id":"https://openalex.org/I4210156221","display_name":"Allen Institute for Artificial Intelligence","ror":"https://ror.org/05w520734","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210156221"]},{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Noah A. Smith","raw_affiliation_strings":["Allen Institute for Artificial Intelligence, Seattle, WA, USA","Paul G. Allen School of Computer Science & Engineering, University of Washington, Seattle, WA, USA","Carnegie Mellon University"],"affiliations":[{"raw_affiliation_string":"Allen Institute for Artificial Intelligence, Seattle, WA, USA","institution_ids":["https://openalex.org/I4210156221"]},{"raw_affiliation_string":"Paul G. Allen School of Computer Science & Engineering, University of Washington, Seattle, WA, USA","institution_ids":["https://openalex.org/I201448701"]},{"raw_affiliation_string":"Carnegie Mellon University","institution_ids":["https://openalex.org/I74973139"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5075783850"],"corresponding_institution_ids":["https://openalex.org/I4210156221"],"apc_list":null,"apc_paid":null,"fwci":1.6897952,"has_fulltext":true,"cited_by_count":14,"citation_normalized_percentile":{"value":0.87244222,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"5880","last_page":"5894"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.9093716740608215},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.7411198019981384},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7145140767097473},{"id":"https://openalex.org/keywords/vampire","display_name":"Vampire","score":0.7131859064102173},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5776656866073608},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5114099383354187},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.488755464553833},{"id":"https://openalex.org/keywords/labeled-data","display_name":"Labeled data","score":0.46455448865890503},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.45870622992515564},{"id":"https://openalex.org/keywords/predictive-coding","display_name":"Predictive coding","score":0.44904860854148865},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.1648852527141571},{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.10404998064041138},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08052194118499756}],"concepts":[{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.9093716740608215},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.7411198019981384},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7145140767097473},{"id":"https://openalex.org/C2776562800","wikidata":"https://www.wikidata.org/wiki/Q7912960","display_name":"Vampire","level":2,"score":0.7131859064102173},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5776656866073608},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5114099383354187},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.488755464553833},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.46455448865890503},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.45870622992515564},{"id":"https://openalex.org/C2778061373","wikidata":"https://www.wikidata.org/wiki/Q1315146","display_name":"Predictive coding","level":3,"score":0.44904860854148865},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.1648852527141571},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.10404998064041138},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08052194118499756},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.18653/v1/p19-1590","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p19-1590","pdf_url":"https://www.aclweb.org/anthology/P19-1590.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1906.02242","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1906.02242","pdf_url":"https://arxiv.org/pdf/1906.02242","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"mag:2948096105","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1906.02242v1","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1906.02242","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1906.02242","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.18653/v1/p19-1590","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p19-1590","pdf_url":"https://www.aclweb.org/anthology/P19-1590.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2948096105.pdf","grobid_xml":"https://content.openalex.org/works/W2948096105.grobid-xml"},"referenced_works_count":42,"referenced_works":["https://openalex.org/W217970951","https://openalex.org/W1567570606","https://openalex.org/W1836465849","https://openalex.org/W1880262756","https://openalex.org/W2048679005","https://openalex.org/W2097089247","https://openalex.org/W2108281845","https://openalex.org/W2113459411","https://openalex.org/W2130339025","https://openalex.org/W2133556223","https://openalex.org/W2145451908","https://openalex.org/W2147946282","https://openalex.org/W2153579005","https://openalex.org/W2159426623","https://openalex.org/W2163568299","https://openalex.org/W2250473257","https://openalex.org/W2250533720","https://openalex.org/W2250539671","https://openalex.org/W2394658926","https://openalex.org/W2483215953","https://openalex.org/W2594155836","https://openalex.org/W2606347107","https://openalex.org/W2888329843","https://openalex.org/W2898700502","https://openalex.org/W2911681509","https://openalex.org/W2914331073","https://openalex.org/W2926555354","https://openalex.org/W2942203175","https://openalex.org/W2949416428","https://openalex.org/W2962739339","https://openalex.org/W2962897886","https://openalex.org/W2963012544","https://openalex.org/W2963026768","https://openalex.org/W2963223306","https://openalex.org/W2963269843","https://openalex.org/W2963341956","https://openalex.org/W2963600562","https://openalex.org/W2963773425","https://openalex.org/W2963858765","https://openalex.org/W2964121744","https://openalex.org/W3099531031","https://openalex.org/W6603175991"],"related_works":["https://openalex.org/W2963997607","https://openalex.org/W3196704128","https://openalex.org/W2951701153","https://openalex.org/W3122629327","https://openalex.org/W2963699875","https://openalex.org/W3127664874","https://openalex.org/W3090196146","https://openalex.org/W2394658926","https://openalex.org/W3206707760","https://openalex.org/W2809669277","https://openalex.org/W2798908575","https://openalex.org/W3103900065","https://openalex.org/W3104081646","https://openalex.org/W3037584823","https://openalex.org/W2742049800","https://openalex.org/W1876424772","https://openalex.org/W2891078859","https://openalex.org/W3193367109","https://openalex.org/W3199188153","https://openalex.org/W2342668609"],"abstract_inverted_index":{"We":[0,18,65,87],"introduce":[1],"VAMPIRE,":[2],"a":[3,20,25,40],"lightweight":[4],"pretraining":[5],"framework":[6],"for":[7],"effective":[8],"text":[9],"classification":[10],"when":[11,82],"data":[12,31,72],"and":[13,32,56,95],"computing":[14],"resources":[15],"are":[16],"limited.":[17],"pretrain":[19,94],"unigram":[21],"document":[22],"model":[23],"as":[24,37],"variational":[26],"autoencoder":[27],"on":[28],"in-domain,":[29],"unlabeled":[30],"use":[33,96],"its":[34],"internal":[35],"states":[36],"features":[38],"in":[39,99],"downstream":[41,100],"classifier.":[42],"Empirically,":[43],"we":[44],"show":[45],"the":[46],"relative":[47],"strength":[48],"of":[49],"VAMPIRE":[50,97],"against":[51],"computationally":[52],"expensive":[53],"contextual":[54,80],"embeddings":[55,81,98],"other":[57],"popular":[58],"semi-supervised":[59],"baselines":[60],"under":[61],"low":[62],"resource":[63],"settings.":[64],"also":[66],"find":[67],"that":[68],"fine-tuning":[69],"to":[70,75,93],"in-domain":[71],"is":[73],"crucial":[74],"achieving":[76],"decent":[77],"performance":[78],"from":[79],"working":[83],"with":[84,91],"limited":[85],"supervision.":[86],"accompany":[88],"this":[89],"paper":[90],"code":[92],"tasks.":[101]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":6},{"year":2020,"cited_by_count":3}],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2025-10-10T00:00:00"}
