{"id":"https://openalex.org/W4416016992","doi":"https://doi.org/10.1145/3746252.3761238","title":"Constructing Set-Compositional and Negated Representations for First-Stage Ranking","display_name":"Constructing Set-Compositional and Negated Representations for First-Stage Ranking","publication_year":2025,"publication_date":"2025-11-07","ids":{"openalex":"https://openalex.org/W4416016992","doi":"https://doi.org/10.1145/3746252.3761238"},"language":null,"primary_location":{"id":"doi:10.1145/3746252.3761238","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3746252.3761238","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 34th ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3746252.3761238","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086252961","display_name":"Antonios Minas Krasakis","orcid":"https://orcid.org/0000-0001-5040-7085"},"institutions":[{"id":"https://openalex.org/I4210135670","display_name":"Amsterdam University of the Arts","ror":"https://ror.org/04dde1554","country_code":"NL","type":"education","lineage":["https://openalex.org/I4210135670"]},{"id":"https://openalex.org/I887064364","display_name":"University of Amsterdam","ror":"https://ror.org/04dkp9463","country_code":"NL","type":"education","lineage":["https://openalex.org/I887064364"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Antonios Minas Krasakis","raw_affiliation_strings":["University of Amsterdam, Amsterdam, Netherlands"],"raw_orcid":"https://orcid.org/0000-0001-5040-7085","affiliations":[{"raw_affiliation_string":"University of Amsterdam, Amsterdam, Netherlands","institution_ids":["https://openalex.org/I4210135670","https://openalex.org/I887064364"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059489981","display_name":"Andrew Yates","orcid":"https://orcid.org/0000-0002-5970-880X"},"institutions":[{"id":"https://openalex.org/I145311948","display_name":"Johns Hopkins University","ror":"https://ror.org/00za53h95","country_code":"US","type":"education","lineage":["https://openalex.org/I145311948"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Andrew Yates","raw_affiliation_strings":["HLTCOE, Johns Hopkins University, Baltimore, MD, USA"],"raw_orcid":"https://orcid.org/0000-0002-5970-880X","affiliations":[{"raw_affiliation_string":"HLTCOE, Johns Hopkins University, Baltimore, MD, USA","institution_ids":["https://openalex.org/I145311948"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5055639036","display_name":"Evangelos Kanoulas","orcid":"https://orcid.org/0000-0002-8312-0694"},"institutions":[{"id":"https://openalex.org/I4210135670","display_name":"Amsterdam University of the Arts","ror":"https://ror.org/04dde1554","country_code":"NL","type":"education","lineage":["https://openalex.org/I4210135670"]},{"id":"https://openalex.org/I887064364","display_name":"University of Amsterdam","ror":"https://ror.org/04dkp9463","country_code":"NL","type":"education","lineage":["https://openalex.org/I887064364"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Evangelos Kanoulas","raw_affiliation_strings":["University of Amsterdam, Amsterdam, Netherlands"],"raw_orcid":"https://orcid.org/0000-0002-8312-0694","affiliations":[{"raw_affiliation_string":"University of Amsterdam, Amsterdam, Netherlands","institution_ids":["https://openalex.org/I4210135670","https://openalex.org/I887064364"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5086252961"],"corresponding_institution_ids":["https://openalex.org/I4210135670","https://openalex.org/I887064364"],"apc_list":null,"apc_paid":null,"fwci":2.9051,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.93635903,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1406","last_page":"1416"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.3919999897480011,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.3919999897480011,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12157","display_name":"Geochemistry and Geologic Mapping","score":0.12610000371932983,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.0348999984562397,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.6757000088691711},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.598800003528595},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5950999855995178},{"id":"https://openalex.org/keywords/negation","display_name":"Negation","score":0.538100004196167},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.4284999966621399},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.4050000011920929},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.35030001401901245}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7537999749183655},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.6757000088691711},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.603600025177002},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.598800003528595},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5950999855995178},{"id":"https://openalex.org/C2185349","wikidata":"https://www.wikidata.org/wiki/Q190558","display_name":"Negation","level":2,"score":0.538100004196167},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.4284999966621399},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42590001225471497},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.4050000011920929},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.35030001401901245},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3422999978065491},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.33489999175071716},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.3294999897480011},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.29280000925064087},{"id":"https://openalex.org/C100643331","wikidata":"https://www.wikidata.org/wiki/Q205170","display_name":"Power set","level":3,"score":0.2874000072479248},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.27219998836517334},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.2694999873638153},{"id":"https://openalex.org/C89686163","wikidata":"https://www.wikidata.org/wiki/Q1187982","display_name":"Vector space model","level":2,"score":0.25839999318122864}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3746252.3761238","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3746252.3761238","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 34th ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3746252.3761238","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3746252.3761238","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 34th ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6620427566","display_name":null,"funder_award_id":"016.Vidi.189.039, VI.Vidi.223.166","funder_id":"https://openalex.org/F4320321800","funder_display_name":"Nederlandse Organisatie voor Wetenschappelijk Onderzoek"}],"funders":[{"id":"https://openalex.org/F4320321800","display_name":"Nederlandse Organisatie voor Wetenschappelijk Onderzoek","ror":"https://ror.org/04jsz6e67"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W74952720","https://openalex.org/W296439881","https://openalex.org/W1965943263","https://openalex.org/W2000672666","https://openalex.org/W2035798593","https://openalex.org/W2055113847","https://openalex.org/W2096468639","https://openalex.org/W2113989144","https://openalex.org/W2147844972","https://openalex.org/W2889787757","https://openalex.org/W3021397474","https://openalex.org/W3047936157","https://openalex.org/W3099843385","https://openalex.org/W3134384212","https://openalex.org/W3134665270","https://openalex.org/W3154280800","https://openalex.org/W3154755316","https://openalex.org/W3155114168","https://openalex.org/W3180230246","https://openalex.org/W4213259724","https://openalex.org/W4248510436","https://openalex.org/W4252076394","https://openalex.org/W4285287265","https://openalex.org/W4327499170","https://openalex.org/W4385570290","https://openalex.org/W4396821195"],"related_works":[],"abstract_inverted_index":{"Set":[0],"compositional":[1,52,137],"and":[2,12,41,61,111,131,144,154,169],"negated":[3,106,175],"queries":[4,42],"are":[5],"crucial":[6],"for":[7,50,159],"expressing":[8],"complex":[9],"information":[10],"needs":[11],"enable":[13],"the":[14,25,36,71,105,174],"discovery":[15],"of":[16,38,74,108,142,151],"niche":[17],"items":[18],"like":[19],"''Books":[20],"about":[21],"non-European":[22],"monarchs''.":[23],"Despite":[24],"recent":[26],"advances":[27],"in":[28,82],"LLMs,":[29],"first-stage":[30],"ranking":[31],"remains":[32],"challenging":[33],"due":[34],"to":[35,65,120,164],"requirement":[37],"encoding":[39],"documents":[40,68,172],"independently":[43],"from":[44],"each":[45],"other.":[46],"This":[47],"limitation":[48],"calls":[49],"constructing":[51,79],"query":[53],"representations":[54,81],"that":[55,102,116,125],"encapsulate":[56],"logical":[57],"operations":[58,88],"or":[59],"negations,":[60],"can":[62],"be":[63],"used":[64],"match":[66],"relevant":[67],"effectively.":[69],"In":[70],"first":[72],"part":[73],"this":[75],"work,":[76],"we":[77,98,148],"explore":[78],"such":[80],"a":[83,109,112],"zero-shot":[84,127],"setting":[85],"using":[86],"vector":[87],"between":[89],"lexically":[90],"grounded":[91],"Learned":[92],"Sparse":[93],"Retrieval":[94],"(LSR)":[95],"representations.":[96],"Specifically,":[97],"introduce":[99],"Disentangled":[100],"Negation":[101],"penalizes":[103],"only":[104],"parts":[107],"query,":[110],"Combined":[113],"Pseudo-Term":[114],"approach":[115,128],"enhances":[117],"LSR's":[118,156],"ability":[119],"handle":[121],"intersections.":[122],"We":[123],"find":[124],"our":[126],"is":[129],"competitive":[130],"often":[132],"outperforms":[133],"retrievers":[134],"fine-tuned":[135],"on":[136],"data,":[138],"highlighting":[139],"certain":[140],"limitations":[141,153],"LSR":[143],"Dense":[145],"Retrievers.":[146],"Finally,":[147],"address":[149],"some":[150],"these":[152],"improve":[155],"representation":[157],"power":[158],"negation,":[160],"by":[161],"allowing":[162],"them":[163],"attribute":[165],"negative":[166],"term":[167],"scores":[168],"effectively":[170],"penalize":[171],"containing":[173],"terms.":[176]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-11-08T00:00:00"}
