{"id":"https://openalex.org/W3018814697","doi":"https://doi.org/10.1145/3397271.3401211","title":"Learning Term Discrimination","display_name":"Learning Term Discrimination","publication_year":2020,"publication_date":"2020-07-25","ids":{"openalex":"https://openalex.org/W3018814697","doi":"https://doi.org/10.1145/3397271.3401211","mag":"3018814697"},"language":"en","primary_location":{"id":"doi:10.1145/3397271.3401211","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3397271.3401211","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 43rd International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2004.11759","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5005643082","display_name":"Jibril Frej","orcid":"https://orcid.org/0009-0009-0631-0636"},"institutions":[{"id":"https://openalex.org/I4210104430","display_name":"Laboratoire d'Informatique de Grenoble","ror":"https://ror.org/01c8rcg82","country_code":"FR","type":"facility","lineage":["https://openalex.org/I106785703","https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I4210104430","https://openalex.org/I4210159245","https://openalex.org/I899635006","https://openalex.org/I899635006"]},{"id":"https://openalex.org/I899635006","display_name":"Universit\u00e9 Grenoble Alpes","ror":"https://ror.org/02rx3b187","country_code":"FR","type":"education","lineage":["https://openalex.org/I899635006"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Jibril Frej","raw_affiliation_strings":["LIG - Laboratoire d'Informatique de Grenoble, Grenoble (38), France"],"affiliations":[{"raw_affiliation_string":"LIG - Laboratoire d'Informatique de Grenoble, Grenoble (38), France","institution_ids":["https://openalex.org/I4210104430","https://openalex.org/I899635006"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000438626","display_name":"Phillipe Mulhem","orcid":null},"institutions":[{"id":"https://openalex.org/I899635006","display_name":"Universit\u00e9 Grenoble Alpes","ror":"https://ror.org/02rx3b187","country_code":"FR","type":"education","lineage":["https://openalex.org/I899635006"]},{"id":"https://openalex.org/I4210104430","display_name":"Laboratoire d'Informatique de Grenoble","ror":"https://ror.org/01c8rcg82","country_code":"FR","type":"facility","lineage":["https://openalex.org/I106785703","https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I4210104430","https://openalex.org/I4210159245","https://openalex.org/I899635006","https://openalex.org/I899635006"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Philippe Mulhem","raw_affiliation_strings":["LIG - Laboratoire d'Informatique de Grenoble, Grenoble (38), France"],"affiliations":[{"raw_affiliation_string":"LIG - Laboratoire d'Informatique de Grenoble, Grenoble (38), France","institution_ids":["https://openalex.org/I4210104430","https://openalex.org/I899635006"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013799481","display_name":"Didier Schwab","orcid":"https://orcid.org/0000-0002-2462-8148"},"institutions":[{"id":"https://openalex.org/I4210104430","display_name":"Laboratoire d'Informatique de Grenoble","ror":"https://ror.org/01c8rcg82","country_code":"FR","type":"facility","lineage":["https://openalex.org/I106785703","https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I4210104430","https://openalex.org/I4210159245","https://openalex.org/I899635006","https://openalex.org/I899635006"]},{"id":"https://openalex.org/I899635006","display_name":"Universit\u00e9 Grenoble Alpes","ror":"https://ror.org/02rx3b187","country_code":"FR","type":"education","lineage":["https://openalex.org/I899635006"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Didier Schwab","raw_affiliation_strings":["LIG - Laboratoire d'Informatique de Grenoble, Grenoble (38), France"],"affiliations":[{"raw_affiliation_string":"LIG - Laboratoire d'Informatique de Grenoble, Grenoble (38), France","institution_ids":["https://openalex.org/I4210104430","https://openalex.org/I899635006"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5108156680","display_name":"Jean\u2013Pierre Chevallet","orcid":null},"institutions":[{"id":"https://openalex.org/I899635006","display_name":"Universit\u00e9 Grenoble Alpes","ror":"https://ror.org/02rx3b187","country_code":"FR","type":"education","lineage":["https://openalex.org/I899635006"]},{"id":"https://openalex.org/I4210104430","display_name":"Laboratoire d'Informatique de Grenoble","ror":"https://ror.org/01c8rcg82","country_code":"FR","type":"facility","lineage":["https://openalex.org/I106785703","https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I4210104430","https://openalex.org/I4210159245","https://openalex.org/I899635006","https://openalex.org/I899635006"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Jean-Pierre Chevallet","raw_affiliation_strings":["LIG - Laboratoire d'Informatique de Grenoble, Grenoble (38), France"],"affiliations":[{"raw_affiliation_string":"LIG - Laboratoire d'Informatique de Grenoble, Grenoble (38), France","institution_ids":["https://openalex.org/I4210104430","https://openalex.org/I899635006"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5005643082"],"corresponding_institution_ids":["https://openalex.org/I4210104430","https://openalex.org/I899635006"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.04042052,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1993","last_page":"1996"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8070589303970337},{"id":"https://openalex.org/keywords/term-discrimination","display_name":"Term Discrimination","score":0.7742905020713806},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.7069947123527527},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.6849931478500366},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.6512842178344727},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6272258758544922},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.6084602475166321},{"id":"https://openalex.org/keywords/tf\u2013idf","display_name":"tf\u2013idf","score":0.6079502701759338},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.566595196723938},{"id":"https://openalex.org/keywords/inverted-index","display_name":"Inverted index","score":0.5208066701889038},{"id":"https://openalex.org/keywords/document-retrieval","display_name":"Document retrieval","score":0.5156830549240112},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.4940545856952667},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47858548164367676},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.4596308171749115},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.4548996686935425},{"id":"https://openalex.org/keywords/vector-space-model","display_name":"Vector space model","score":0.43208351731300354},{"id":"https://openalex.org/keywords/search-engine","display_name":"Search engine","score":0.18629449605941772},{"id":"https://openalex.org/keywords/web-search-query","display_name":"Web search query","score":0.10459724068641663},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09308740496635437},{"id":"https://openalex.org/keywords/concept-search","display_name":"Concept search","score":0.0930357277393341}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8070589303970337},{"id":"https://openalex.org/C22639730","wikidata":"https://www.wikidata.org/wiki/Q7702546","display_name":"Term Discrimination","level":5,"score":0.7742905020713806},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.7069947123527527},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.6849931478500366},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.6512842178344727},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6272258758544922},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.6084602475166321},{"id":"https://openalex.org/C81758059","wikidata":"https://www.wikidata.org/wiki/Q796584","display_name":"tf\u2013idf","level":3,"score":0.6079502701759338},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.566595196723938},{"id":"https://openalex.org/C130590232","wikidata":"https://www.wikidata.org/wiki/Q1671754","display_name":"Inverted index","level":3,"score":0.5208066701889038},{"id":"https://openalex.org/C161156560","wikidata":"https://www.wikidata.org/wiki/Q1638872","display_name":"Document retrieval","level":2,"score":0.5156830549240112},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.4940545856952667},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47858548164367676},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.4596308171749115},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.4548996686935425},{"id":"https://openalex.org/C89686163","wikidata":"https://www.wikidata.org/wiki/Q1187982","display_name":"Vector space model","level":2,"score":0.43208351731300354},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.18629449605941772},{"id":"https://openalex.org/C164120249","wikidata":"https://www.wikidata.org/wiki/Q995982","display_name":"Web search query","level":3,"score":0.10459724068641663},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09308740496635437},{"id":"https://openalex.org/C182861755","wikidata":"https://www.wikidata.org/wiki/Q5158391","display_name":"Concept search","level":4,"score":0.0930357277393341},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1145/3397271.3401211","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3397271.3401211","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 43rd International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2004.11759","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2004.11759","pdf_url":"https://arxiv.org/pdf/2004.11759","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"mag:3018814697","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/2004.11759.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"pmh:oai:HAL:hal-03024756v1","is_oa":true,"landing_page_url":"https://hal.science/hal-03024756","pdf_url":null,"source":null,"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"https://sigir.org/sigir2020/","raw_type":"Conference papers"},{"id":"doi:10.48550/arxiv.2004.11759","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2004.11759","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2004.11759","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2004.11759","pdf_url":"https://arxiv.org/pdf/2004.11759","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"score":0.7099999785423279,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W1908696901","https://openalex.org/W2064203736","https://openalex.org/W2110963081","https://openalex.org/W2134557008","https://openalex.org/W2136542423","https://openalex.org/W2155482025","https://openalex.org/W2165612380","https://openalex.org/W2271840356","https://openalex.org/W2536015822","https://openalex.org/W2539671052","https://openalex.org/W2783640434","https://openalex.org/W2897754576","https://openalex.org/W2962772361","https://openalex.org/W2964121744","https://openalex.org/W2964254569","https://openalex.org/W3098620803","https://openalex.org/W4252076394"],"related_works":["https://openalex.org/W3034868781","https://openalex.org/W2060772891","https://openalex.org/W2188767364","https://openalex.org/W2028747520","https://openalex.org/W2465801315","https://openalex.org/W2051274382","https://openalex.org/W2003984229","https://openalex.org/W2045517286","https://openalex.org/W2975751652","https://openalex.org/W2554132354","https://openalex.org/W2009593660","https://openalex.org/W2527562421","https://openalex.org/W2093270409","https://openalex.org/W3154755316","https://openalex.org/W3023238803","https://openalex.org/W2413524007","https://openalex.org/W2135290016","https://openalex.org/W1702656447","https://openalex.org/W2125398996","https://openalex.org/W2763456122"],"abstract_inverted_index":{"Document":[0],"indexing":[1,70],"is":[2,144],"a":[3,35,38],"key":[4],"component":[5],"for":[6,68],"efficient":[7],"information":[8],"retrieval":[9,141,151],"(IR).":[10],"After":[11],"preprocessing":[12],"steps":[13],"such":[14,48,81],"as":[15,49,82,105],"stemming":[16],"and":[17,84,94,137],"stop-word":[18],"removal,":[19],"document":[20,51,69],"indexes":[21],"usually":[22],"store":[23],"term-frequencies":[24],"(tf).":[25],"Along":[26],"with":[27,71,99],"tf":[28],"(that":[29],"only":[30],"reflects":[31],"the":[32,118,130,134,140],"importance":[33],"of":[34,92,117,133],"term":[36,44],"in":[37,90],"document),":[39],"traditional":[40,77,96],"IR":[41,78],"models":[42],"use":[43],"discrimination":[45,123],"values":[46],"(TDVs)":[47],"inverse":[50],"frequency":[52],"(idf)":[53],"to":[54,65,113,126,146],"favor":[55],"discriminative":[56],"terms":[57,91,116],"during":[58],"retrieval.":[59],"In":[60],"this":[61],"work,":[62],"we":[63],"propose":[64],"learn":[66],"TDVs":[67],"shallow":[72],"neural":[73],"networks":[74],"that":[75,120],"approximate":[76],"ranking":[79],"functions":[80],"TF-IDF":[83],"BM25.":[85],"Our":[86,108],"proposal":[87],"outperforms,":[88],"both":[89,127],"nDCG":[93],"recall,":[95],"approaches,":[97],"even":[98],"few":[100],"positively":[101],"labelled":[102],"query-document":[103],"pairs":[104],"learning":[106],"data.":[107],"learned":[109],"TDVs,":[110],"when":[111],"used":[112],"filter":[114],"out":[115],"vocabulary":[119],"have":[121],"zero":[122],"value,":[124],"allow":[125],"significantly":[128],"lower":[129],"memory":[131],"footprint":[132],"inverted":[135],"index":[136],"speed":[138],"up":[139,145],"process":[142],"(BM25":[143],"3~times":[147],"faster),":[148],"without":[149],"degrading":[150],"quality.":[152]},"counts_by_year":[],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2025-10-10T00:00:00"}
