{"id":"https://openalex.org/W4387225640","doi":"https://doi.org/10.48550/arxiv.2309.16540","title":"Unsupervised Pretraining for Fact Verification by Language Model Distillation","display_name":"Unsupervised Pretraining for Fact Verification by Language Model Distillation","publication_year":2023,"publication_date":"2023-09-28","ids":{"openalex":"https://openalex.org/W4387225640","doi":"https://doi.org/10.48550/arxiv.2309.16540"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2309.16540","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2309.16540","pdf_url":"https://arxiv.org/pdf/2309.16540","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2309.16540","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5029139684","display_name":"Adri\u00e1n Bazaga","orcid":"https://orcid.org/0000-0002-1508-285X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Bazaga, Adri\u00e1n","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056748708","display_name":"P\u00edetro Li\u00f3","orcid":"https://orcid.org/0000-0002-0540-5053"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li\u00f2, Pietro","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5048731023","display_name":"Gos Micklem","orcid":"https://orcid.org/0000-0002-6883-6168"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Micklem, Gos","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5029139684"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9779000282287598,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8522029519081116},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6923633217811584},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6858097314834595},{"id":"https://openalex.org/keywords/trustworthiness","display_name":"Trustworthiness","score":0.5513338446617126},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5465986728668213},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.46394988894462585},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4564014971256256},{"id":"https://openalex.org/keywords/contrast","display_name":"Contrast (vision)","score":0.42443040013313293},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.422471821308136}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8522029519081116},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6923633217811584},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6858097314834595},{"id":"https://openalex.org/C153701036","wikidata":"https://www.wikidata.org/wiki/Q659974","display_name":"Trustworthiness","level":2,"score":0.5513338446617126},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5465986728668213},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.46394988894462585},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4564014971256256},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.42443040013313293},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.422471821308136},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2309.16540","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2309.16540","pdf_url":"https://arxiv.org/pdf/2309.16540","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2309.16540","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2309.16540","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2309.16540","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2309.16540","pdf_url":"https://arxiv.org/pdf/2309.16540","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"score":0.4699999988079071,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4387225640.pdf","grobid_xml":"https://content.openalex.org/works/W4387225640.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2076536433","https://openalex.org/W90316445","https://openalex.org/W2069592018","https://openalex.org/W2075740387","https://openalex.org/W4327743613","https://openalex.org/W2965447900","https://openalex.org/W2358990940","https://openalex.org/W3199750033","https://openalex.org/W2374509987","https://openalex.org/W2093931120"],"abstract_inverted_index":{"Fact":[0,67],"verification":[1],"aims":[2],"to":[3,33,44,83,108],"verify":[4],"a":[5,10,35,73,100,129],"claim":[6,24,111],"using":[7],"evidence":[8,113],"from":[9],"trustworthy":[11],"knowledge":[12],"base.":[13],"To":[14],"address":[15],"this":[16],"challenge,":[17],"algorithms":[18],"must":[19],"produce":[20],"features":[21,86,107],"for":[22,94],"every":[23],"that":[25,78,105,127],"are":[26],"both":[27],"semantically":[28],"meaningful,":[29],"and":[30,59,112,136],"compact":[31],"enough":[32],"find":[34],"semantic":[36,118],"alignment":[37,50],"with":[38,140],"the":[39,49,92,117,121],"source":[40],"information.":[41],"In":[42],"contrast":[43],"previous":[45],"work,":[46],"which":[47],"tackled":[48],"problem":[51],"by":[52,99],"learning":[53],"over":[54],"annotated":[55],"corpora":[56],"of":[57],"claims":[58],"their":[60],"corresponding":[61],"labels,":[62],"we":[63,124],"propose":[64],"SFAVEL":[65],"(Self-supervised":[66],"Verification":[68],"via":[69],"Language":[70],"Model":[71],"Distillation),":[72],"novel":[74,101],"unsupervised":[75],"pretraining":[76],"framework":[77],"leverages":[79],"pre-trained":[80],"language":[81],"models":[82],"distil":[84],"self-supervised":[85],"into":[87],"high-quality":[88,110],"claim-fact":[89],"alignments":[90,114],"without":[91],"need":[93],"annotations.":[95],"This":[96],"is":[97],"enabled":[98],"contrastive":[102],"loss":[103],"function":[104],"encourages":[106],"attain":[109],"whilst":[115],"preserving":[116],"relationships":[119],"across":[120],"corpora.":[122],"Notably,":[123],"present":[125],"results":[126],"achieve":[128],"new":[130],"state-of-the-art":[131],"on":[132],"FB15k-237":[133],"(+5.3%":[134],"Hits@1)":[135],"FEVER":[137],"(+8%":[138],"accuracy)":[139],"linear":[141],"evaluation.":[142]},"counts_by_year":[],"updated_date":"2026-03-12T08:34:05.389933","created_date":"2023-10-01T00:00:00"}
