{"id":"https://openalex.org/W4384823501","doi":"https://doi.org/10.1145/3539618.3591805","title":"Tevatron: An Efficient and Flexible Toolkit for Neural Retrieval","display_name":"Tevatron: An Efficient and Flexible Toolkit for Neural Retrieval","publication_year":2023,"publication_date":"2023-07-18","ids":{"openalex":"https://openalex.org/W4384823501","doi":"https://doi.org/10.1145/3539618.3591805"},"language":"en","primary_location":{"id":"doi:10.1145/3539618.3591805","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3539618.3591805","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 46th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5060885692","display_name":"Luyu Gao","orcid":"https://orcid.org/0009-0006-5806-3022"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Luyu Gao","raw_affiliation_strings":["Carnegie Mellon University, Pittsburgh, PA, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021623012","display_name":"Xueguang Ma","orcid":"https://orcid.org/0000-0003-3430-4910"},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Xueguang Ma","raw_affiliation_strings":["University of Waterloo, Waterloo, ON, Canada"],"affiliations":[{"raw_affiliation_string":"University of Waterloo, Waterloo, ON, Canada","institution_ids":["https://openalex.org/I151746483"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082997975","display_name":"Jimmy Lin","orcid":"https://orcid.org/0000-0002-0661-7189"},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Jimmy Lin","raw_affiliation_strings":["University of Waterloo, Waterloo, ON, Canada"],"affiliations":[{"raw_affiliation_string":"University of Waterloo, Waterloo, ON, Canada","institution_ids":["https://openalex.org/I151746483"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009879041","display_name":"Jamie Callan","orcid":null},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jamie Callan","raw_affiliation_strings":["Carnegie Mellon University, Pittsburgh, PA, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I74973139"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5060885692"],"corresponding_institution_ids":["https://openalex.org/I74973139"],"apc_list":null,"apc_paid":null,"fwci":2.7653,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.92175059,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"3120","last_page":"3124"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/tevatron","display_name":"Tevatron","score":0.8342776298522949},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8276734352111816},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.5312119722366333},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5254349112510681},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.5234886407852173},{"id":"https://openalex.org/keywords/implementation","display_name":"Implementation","score":0.4944603443145752},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.48489195108413696},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.42051127552986145},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.42034512758255005},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3363344669342041},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.32149165868759155},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.23547783493995667},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.16671475768089294},{"id":"https://openalex.org/keywords/large-hadron-collider","display_name":"Large Hadron Collider","score":0.13288703560829163},{"id":"https://openalex.org/keywords/particle-physics","display_name":"Particle physics","score":0.0860578715801239}],"concepts":[{"id":"https://openalex.org/C2780715337","wikidata":"https://www.wikidata.org/wiki/Q944533","display_name":"Tevatron","level":3,"score":0.8342776298522949},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8276734352111816},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.5312119722366333},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5254349112510681},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.5234886407852173},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.4944603443145752},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.48489195108413696},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.42051127552986145},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42034512758255005},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3363344669342041},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32149165868759155},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.23547783493995667},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.16671475768089294},{"id":"https://openalex.org/C87668248","wikidata":"https://www.wikidata.org/wiki/Q40605","display_name":"Large Hadron Collider","level":2,"score":0.13288703560829163},{"id":"https://openalex.org/C109214941","wikidata":"https://www.wikidata.org/wiki/Q18334","display_name":"Particle physics","level":1,"score":0.0860578715801239},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3539618.3591805","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3539618.3591805","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 46th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2165548363","display_name":null,"funder_award_id":"Canada","funder_id":"https://openalex.org/F4320334593","funder_display_name":"Natural Sciences and Engineering Research Council of Canada"},{"id":"https://openalex.org/G8284766523","display_name":null,"funder_award_id":"(NSERC)","funder_id":"https://openalex.org/F4320334593","funder_display_name":"Natural Sciences and Engineering Research Council of Canada"}],"funders":[{"id":"https://openalex.org/F4320334593","display_name":"Natural Sciences and Engineering Research Council of Canada","ror":"https://ror.org/01h531d29"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W1516184288","https://openalex.org/W2124509324","https://openalex.org/W2252136820","https://openalex.org/W2602856279","https://openalex.org/W2912924812","https://openalex.org/W2963339397","https://openalex.org/W2963469388","https://openalex.org/W2963748441","https://openalex.org/W2970971581","https://openalex.org/W2998702515","https://openalex.org/W3045462440","https://openalex.org/W3099700870","https://openalex.org/W3154280800","https://openalex.org/W3168875417","https://openalex.org/W3169937871","https://openalex.org/W3180230246","https://openalex.org/W3184918446","https://openalex.org/W3185250692","https://openalex.org/W3188983256","https://openalex.org/W4206121183","https://openalex.org/W4225156005","https://openalex.org/W4226208814","https://openalex.org/W4284682639","https://openalex.org/W4295312788","https://openalex.org/W6601899773"],"related_works":["https://openalex.org/W1623752107","https://openalex.org/W4205895067","https://openalex.org/W3001020873","https://openalex.org/W1538124858","https://openalex.org/W2061531839","https://openalex.org/W1858011642","https://openalex.org/W1637783486","https://openalex.org/W2950264794","https://openalex.org/W4242558101","https://openalex.org/W2541069095"],"abstract_inverted_index":{"Recent":[0],"rapid":[1],"advances":[2],"in":[3,17,130],"deep":[4],"pre-trained":[5],"language":[6],"models":[7],"and":[8,67,74,88,104,121,136,141,157,161,185],"the":[9],"introduction":[10],"of":[11,29,46,79,128],"large":[12],"datasets":[13],"have":[14,26],"powered":[15],"research":[16,24,43,176],"embedding-based":[18],"neural":[19,58,178],"retrieval.":[20],"While":[21],"many":[22],"excellent":[23],"papers":[25],"emerged,":[27],"most":[28],"them":[30],"come":[31],"with":[32],"their":[33,182],"own":[34],"implementations,":[35],"which":[36,149],"are":[37],"typically":[38],"optimized":[39,63],"for":[40,64,76,112,175],"some":[41],"particular":[42],"goals":[44],"instead":[45],"efficiency":[47,137],"or":[48],"code":[49,68],"organization.":[50],"In":[51,106],"this":[52,131],"paper,":[53,132],"we":[54,164],"introduce":[55],"Tevatron,":[56],"a":[57,77,93,171],"retrieval":[59,179],"toolkit":[60],"that":[61,96,166],"is":[62],"efficiency,":[65],"flexibility,":[66],"simplicity.":[69],"Tevatron":[70,108,129,167],"enables":[71,150],"model":[72,100,155],"training":[73],"evaluation":[75],"variety":[78],"ranking":[80],"components":[81],"such":[82,116],"as":[83,117,170],"dense":[84],"retrievers,":[85,87],"sparse":[86],"rerankers.":[89],"It":[90],"also":[91],"provides":[92],"standardized":[94],"pipeline":[95],"includes":[97],"text":[98],"processing,":[99],"training,":[101],"corpus/query":[102],"encoding,":[103],"search.":[105],"addition,":[107],"incorporates":[109],"well-studied":[110],"methods":[111],"improving":[113],"retriever":[114],"effectiveness":[115,135],"hard":[118],"negative":[119],"mining":[120],"knowledge":[122],"distillation.":[123],"We":[124,144],"provide":[125],"an":[126],"overview":[127],"demonstrating":[133],"its":[134],"on":[138,177],"multiple":[139],"IR":[140],"QA":[142],"datasets.":[143],"highlight":[145],"Tevatron's":[146],"flexible":[147],"design,":[148,183],"easy":[151],"generalization":[152],"across":[153],"datasets,":[154],"architectures,":[156],"accelerator":[158],"platforms":[159],"(GPUs":[160],"TPUs).":[162],"Overall,":[163],"believe":[165],"can":[168],"serve":[169],"solid":[172],"software":[173],"foundation":[174],"systems,":[180],"including":[181],"modeling,":[184],"optimization.":[186]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":6}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
