{"id":"https://openalex.org/W2955732934","doi":"https://doi.org/10.1145/3331184.3331316","title":"Content-Based Weak Supervision for Ad-Hoc Re-Ranking","display_name":"Content-Based Weak Supervision for Ad-Hoc Re-Ranking","publication_year":2019,"publication_date":"2019-07-18","ids":{"openalex":"https://openalex.org/W2955732934","doi":"https://doi.org/10.1145/3331184.3331316","mag":"2955732934"},"language":"en","primary_location":{"id":"doi:10.1145/3331184.3331316","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3331184.3331316","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 42nd International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1707.00189","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014199889","display_name":"Sean MacAvaney","orcid":"https://orcid.org/0000-0002-8914-2659"},"institutions":[{"id":"https://openalex.org/I184565670","display_name":"Georgetown University","ror":"https://ror.org/05vzafd60","country_code":"US","type":"education","lineage":["https://openalex.org/I184565670"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Sean MacAvaney","raw_affiliation_strings":["Georgetown University, Washington, DC, USA"],"affiliations":[{"raw_affiliation_string":"Georgetown University, Washington, DC, USA","institution_ids":["https://openalex.org/I184565670"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059489981","display_name":"Andrew Yates","orcid":"https://orcid.org/0000-0002-5970-880X"},"institutions":[{"id":"https://openalex.org/I4210109712","display_name":"Max Planck Institute for Informatics","ror":"https://ror.org/01w19ak89","country_code":"DE","type":"facility","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210109712"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Andrew Yates","raw_affiliation_strings":["Max Planck Institute for Informatics, Saarbr\u00fccken, Germany"],"affiliations":[{"raw_affiliation_string":"Max Planck Institute for Informatics, Saarbr\u00fccken, Germany","institution_ids":["https://openalex.org/I4210109712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017775632","display_name":"Kai Hui","orcid":"https://orcid.org/0000-0002-3110-7404"},"institutions":[{"id":"https://openalex.org/I4210089985","display_name":"Amazon (Germany)","ror":"https://ror.org/00b9ktm87","country_code":"DE","type":"company","lineage":["https://openalex.org/I1311688040","https://openalex.org/I4210089985"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Kai Hui","raw_affiliation_strings":["Amazon, Berlin, Germany"],"affiliations":[{"raw_affiliation_string":"Amazon, Berlin, Germany","institution_ids":["https://openalex.org/I4210089985"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5062591304","display_name":"Ophir Frieder","orcid":"https://orcid.org/0000-0001-5076-8171"},"institutions":[{"id":"https://openalex.org/I184565670","display_name":"Georgetown University","ror":"https://ror.org/05vzafd60","country_code":"US","type":"education","lineage":["https://openalex.org/I184565670"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ophir Frieder","raw_affiliation_strings":["Georgetown University, Washington, DC, USA"],"affiliations":[{"raw_affiliation_string":"Georgetown University, Washington, DC, USA","institution_ids":["https://openalex.org/I184565670"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5014199889"],"corresponding_institution_ids":["https://openalex.org/I184565670"],"apc_list":null,"apc_paid":null,"fwci":4.185,"has_fulltext":true,"cited_by_count":33,"citation_normalized_percentile":{"value":0.95303711,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"993","last_page":"996"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.8034242391586304},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7757425308227539},{"id":"https://openalex.org/keywords/paragraph","display_name":"Paragraph","score":0.6842203140258789},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.642815113067627},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6003821492195129},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.5741585493087769},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.5095415711402893},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.502842366695404},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.49027588963508606},{"id":"https://openalex.org/keywords/headline","display_name":"Headline","score":0.48571452498435974},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.4711773991584778},{"id":"https://openalex.org/keywords/contrast","display_name":"Contrast (vision)","score":0.46272698044776917},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4281250834465027},{"id":"https://openalex.org/keywords/relevance-feedback","display_name":"Relevance feedback","score":0.42338353395462036},{"id":"https://openalex.org/keywords/labeled-data","display_name":"Labeled data","score":0.42215797305107117},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.39497989416122437},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11372047662734985},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.08072963356971741},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.07006624341011047}],"concepts":[{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.8034242391586304},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7757425308227539},{"id":"https://openalex.org/C2777206241","wikidata":"https://www.wikidata.org/wiki/Q194431","display_name":"Paragraph","level":2,"score":0.6842203140258789},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.642815113067627},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6003821492195129},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.5741585493087769},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.5095415711402893},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.502842366695404},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.49027588963508606},{"id":"https://openalex.org/C2778689934","wikidata":"https://www.wikidata.org/wiki/Q1313396","display_name":"Headline","level":2,"score":0.48571452498435974},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.4711773991584778},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.46272698044776917},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4281250834465027},{"id":"https://openalex.org/C2779532271","wikidata":"https://www.wikidata.org/wiki/Q445558","display_name":"Relevance feedback","level":4,"score":0.42338353395462036},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.42215797305107117},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.39497989416122437},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11372047662734985},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.08072963356971741},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.07006624341011047},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1145/3331184.3331316","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3331184.3331316","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 42nd International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1707.00189","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1707.00189","pdf_url":"https://arxiv.org/pdf/1707.00189","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:pure.mpg.de:item_3184689","is_oa":false,"landing_page_url":"http://hdl.handle.net/21.11116/0000-0005-6B55-4","pdf_url":null,"source":{"id":"https://openalex.org/S4306400654","display_name":"MPG.PuRe (Max Planck Society)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I149899117","host_organization_name":"Max Planck Society","host_organization_lineage":["https://openalex.org/I149899117"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/conferenceObject"},{"id":"pmh:oai:pure.mpg.de:item_3184691","is_oa":true,"landing_page_url":"http://hdl.handle.net/21.11116/0000-0005-6B59-0","pdf_url":null,"source":{"id":"https://openalex.org/S4306400654","display_name":"MPG.PuRe (Max Planck Society)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I149899117","host_organization_name":"Max Planck Society","host_organization_lineage":["https://openalex.org/I149899117"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/workingPaper"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1707.00189","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1707.00189","pdf_url":"https://arxiv.org/pdf/1707.00189","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.5899999737739563,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2955732934.pdf","grobid_xml":"https://content.openalex.org/works/W2955732934.grobid-xml"},"referenced_works_count":22,"referenced_works":["https://openalex.org/W1982858363","https://openalex.org/W2113640060","https://openalex.org/W2126690248","https://openalex.org/W2159665776","https://openalex.org/W2159981039","https://openalex.org/W2429667833","https://openalex.org/W2536015822","https://openalex.org/W2610935556","https://openalex.org/W2616330167","https://openalex.org/W2619206542","https://openalex.org/W2648699835","https://openalex.org/W2740321901","https://openalex.org/W2752382061","https://openalex.org/W2783640434","https://openalex.org/W2810410758","https://openalex.org/W2837948978","https://openalex.org/W2887532538","https://openalex.org/W3101023724","https://openalex.org/W3158986179","https://openalex.org/W3212575067","https://openalex.org/W4297567729","https://openalex.org/W6795224213"],"related_works":["https://openalex.org/W2130553454","https://openalex.org/W3022007134","https://openalex.org/W4317548404","https://openalex.org/W2087783760","https://openalex.org/W3104108945","https://openalex.org/W2033364610","https://openalex.org/W3163689946","https://openalex.org/W2797776314","https://openalex.org/W2153927146","https://openalex.org/W2091066410"],"abstract_inverted_index":{"One":[0],"challenge":[1],"with":[2,20],"neural":[3,79,84],"ranking":[4,85],"is":[5],"the":[6,25],"need":[7],"for":[8,16,31],"a":[9,69,78],"large":[10],"amount":[11],"of":[12,27,64,97],"manually-labeled":[13],"relevance":[14,41],"judgments":[15],"training.":[17],"In":[18],"contrast":[19],"prior":[21,106],"work,":[22],"we":[23,92],"examine":[24],"use":[26],"weak":[28,89,107],"supervision":[29,90,108],"sources":[30,96],"training":[32,57,98],"that":[33,38,59,76,94,111],"yield":[34],"pseudo":[35],"query-document":[36],"pairs":[37,45,99],"already":[39],"exhibit":[40],"(e.g.,":[42],"newswire":[43],"headline-content":[44],"and":[46,72,87,110],"encyclopedic":[47],"heading-paragraph":[48],"pairs).":[49],"We":[50],"also":[51],"propose":[52],"filtering":[53,112],"techniques":[54],"to":[55],"eliminate":[56],"samples":[58],"are":[60,100],"too":[61],"far":[62],"out":[63],"domain":[65],"using":[66],"two":[67],"techniques:":[68],"heuristic-based":[70],"approach":[71],"novel":[73],"supervised":[74],"filter":[75],"re-purposes":[77],"ranker.":[80],"Using":[81],"several":[82],"leading":[83],"architectures":[86],"multiple":[88],"datasets,":[91],"show":[93],"these":[95],"effective":[101],"on":[102],"their":[103],"own":[104],"(outperforming":[105],"techniques),":[109],"can":[113],"further":[114],"improve":[115],"performance.":[116]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":7},{"year":2020,"cited_by_count":12},{"year":2019,"cited_by_count":3}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
