{"id":"https://openalex.org/W4400528870","doi":"https://doi.org/10.1145/3626772.3657992","title":"LLM4Eval: Large Language Model for Evaluation in IR","display_name":"LLM4Eval: Large Language Model for Evaluation in IR","publication_year":2024,"publication_date":"2024-07-10","ids":{"openalex":"https://openalex.org/W4400528870","doi":"https://doi.org/10.1145/3626772.3657992"},"language":"en","primary_location":{"id":"doi:10.1145/3626772.3657992","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3626772.3657992","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 47th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3626772.3657992","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5044972686","display_name":"Hossein A. Rahmani","orcid":"https://orcid.org/0000-0002-2779-4942"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Hossein A. Rahmani","raw_affiliation_strings":["University College London, London, United Kingdom"],"affiliations":[{"raw_affiliation_string":"University College London, London, United Kingdom","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052291325","display_name":"Clemencia Siro","orcid":"https://orcid.org/0000-0001-5301-4244"},"institutions":[{"id":"https://openalex.org/I4210135670","display_name":"Amsterdam University of the Arts","ror":"https://ror.org/04dde1554","country_code":"NL","type":"education","lineage":["https://openalex.org/I4210135670"]},{"id":"https://openalex.org/I887064364","display_name":"University of Amsterdam","ror":"https://ror.org/04dkp9463","country_code":"NL","type":"education","lineage":["https://openalex.org/I887064364"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Clemencia Siro","raw_affiliation_strings":["University of Amsterdam, Amsterdam, Netherlands"],"affiliations":[{"raw_affiliation_string":"University of Amsterdam, Amsterdam, Netherlands","institution_ids":["https://openalex.org/I4210135670","https://openalex.org/I887064364"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063466614","display_name":"Mohammad Aliannejadi","orcid":"https://orcid.org/0000-0002-9447-4172"},"institutions":[{"id":"https://openalex.org/I887064364","display_name":"University of Amsterdam","ror":"https://ror.org/04dkp9463","country_code":"NL","type":"education","lineage":["https://openalex.org/I887064364"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Mohammad Aliannejadi","raw_affiliation_strings":["University of Amsterdam, Amstedam, Netherlands"],"affiliations":[{"raw_affiliation_string":"University of Amsterdam, Amstedam, Netherlands","institution_ids":["https://openalex.org/I887064364"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055132321","display_name":"Nick Craswell","orcid":"https://orcid.org/0000-0002-9351-8137"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]},{"id":"https://openalex.org/I58610484","display_name":"Seattle University","ror":"https://ror.org/02jqc0m91","country_code":"US","type":"education","lineage":["https://openalex.org/I58610484"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nick Craswell","raw_affiliation_strings":["Microsoft, Seattle, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft, Seattle, USA","institution_ids":["https://openalex.org/I1290206253","https://openalex.org/I58610484"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037737168","display_name":"Charles L. A. Clarke","orcid":"https://orcid.org/0000-0001-8178-9194"},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Charles L. A. Clarke","raw_affiliation_strings":["University of Waterloo, Waterloo, Canada"],"affiliations":[{"raw_affiliation_string":"University of Waterloo, Waterloo, Canada","institution_ids":["https://openalex.org/I151746483"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079246354","display_name":"Guglielmo Faggioli","orcid":"https://orcid.org/0000-0002-5070-2049"},"institutions":[{"id":"https://openalex.org/I138689650","display_name":"University of Padua","ror":"https://ror.org/00240q980","country_code":"IT","type":"education","lineage":["https://openalex.org/I138689650"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Guglielmo Faggioli","raw_affiliation_strings":["University of Padua, Padua, Italy"],"affiliations":[{"raw_affiliation_string":"University of Padua, Padua, Italy","institution_ids":["https://openalex.org/I138689650"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048533217","display_name":"Bhaskar Mitra","orcid":"https://orcid.org/0000-0002-5270-5550"},"institutions":[{"id":"https://openalex.org/I4210153468","display_name":"Microsoft (Canada)","ror":"https://ror.org/04xhxg104","country_code":"CA","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210153468"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Bhaskar Mitra","raw_affiliation_strings":["Microsoft, Montreal, QC, Canada"],"affiliations":[{"raw_affiliation_string":"Microsoft, Montreal, QC, Canada","institution_ids":["https://openalex.org/I4210153468"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046377370","display_name":"Paul Thomas","orcid":"https://orcid.org/0000-0003-2425-3136"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Paul Thomas","raw_affiliation_strings":["Microsoft, Adelaide, Australia"],"affiliations":[{"raw_affiliation_string":"Microsoft, Adelaide, Australia","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101716010","display_name":"Emine Yilmaz","orcid":"https://orcid.org/0000-0003-4734-4532"},"institutions":[{"id":"https://openalex.org/I4210123934","display_name":"Amazon (United Kingdom)","ror":"https://ror.org/02xey9634","country_code":"GB","type":"company","lineage":["https://openalex.org/I1311688040","https://openalex.org/I4210123934"]},{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Emine Yilmaz","raw_affiliation_strings":["University College London &amp; Amazon, London, United Kingdom"],"affiliations":[{"raw_affiliation_string":"University College London &amp; Amazon, London, United Kingdom","institution_ids":["https://openalex.org/I4210123934","https://openalex.org/I45129253"]}]}],"institutions":[],"countries_distinct_count":5,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5044972686"],"corresponding_institution_ids":["https://openalex.org/I45129253"],"apc_list":null,"apc_paid":null,"fwci":6.4727,"has_fulltext":true,"cited_by_count":19,"citation_normalized_percentile":{"value":0.97069379,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"3040","last_page":"3043"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.9805999994277954,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9724000096321106,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6963107585906982},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.4136735200881958},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4078904390335083}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6963107585906982},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.4136735200881958},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4078904390335083}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3626772.3657992","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3626772.3657992","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 47th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},{"id":"pmh:oai:dare.uva.nl:openaire_cris_publications/a9d321ea-dd78-4321-a79d-7eca8b0597b0","is_oa":true,"landing_page_url":"https://handle.uba.uva.nl/personal/pure/en/publications/llm4eval-large-language-model-for-evaluation-in-ir(a9d321ea-dd78-4321-a79d-7eca8b0597b0).html","pdf_url":"https://pure.uva.nl/ws/files/244504343/3626772.3657992.pdf","source":{"id":"https://openalex.org/S4306400088","display_name":"UvA-DARE (University of Amsterdam)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I887064364","host_organization_name":"University of Amsterdam","host_organization_lineage":["https://openalex.org/I887064364"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Rahmani, H A, Siro, C, Aliannejadi, M, Craswell, N, Clarke, C L A, Faggioli, G, Mitra, B, Thomas, P & Yilmaz, E 2024, LLM4Eval: Large Language Model for Evaluation in IR. in SIGIR '24 : Proceedings of the 47th International ACM SIGIR Conference on Research and Development in Information Retrieval : July 14-18, 2024, Washington, DC, USA. Association for Computing Machinery, New York, NY, pp. 3040-3043, 47th International ACM SIGIR Conference on Research and Development in Information Retrieval, SIGIR 2024, Washington, United States, 14/07/24. https://doi.org/10.1145/3626772.3657992","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:www.research.unipd.it:11577/3555946","is_oa":true,"landing_page_url":"https://hdl.handle.net/11577/3555946","pdf_url":null,"source":{"id":"https://openalex.org/S4377196283","display_name":"Research Padua  Archive (University of Padua)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I138689650","host_organization_name":"University of Padua","host_organization_lineage":["https://openalex.org/I138689650"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":{"id":"doi:10.1145/3626772.3657992","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3626772.3657992","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 47th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.6800000071525574,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G1361938442","display_name":null,"funder_award_id":"Fellowship","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G4583412171","display_name":null,"funder_award_id":"EP/S021566/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G7114785046","display_name":"Task Based Information Retrieval","funder_award_id":"EP/P024289/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G7929798828","display_name":null,"funder_award_id":"EP/P024289/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G8719353587","display_name":null,"funder_award_id":"EP/P0","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320321008","display_name":"Universiteit van Amsterdam","ror":"https://ror.org/04dkp9463"},{"id":"https://openalex.org/F4320321014","display_name":"Vrije Universiteit Amsterdam","ror":"https://ror.org/008xxew50"},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":6,"referenced_works":["https://openalex.org/W3027879771","https://openalex.org/W4385688511","https://openalex.org/W4389518874","https://openalex.org/W4389519254","https://openalex.org/W4400530533","https://openalex.org/W4401043313"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W2382290278","https://openalex.org/W4395014643"],"abstract_inverted_index":{"Large":[0],"language":[1,48],"models":[2,37],"(LLMs)":[3],"have":[4,38],"demonstrated":[5],"increasing":[6],"task-solving":[7],"abilities":[8],"not":[9],"present":[10],"in":[11,30,41,108,128],"smaller":[12],"models.":[13],"Utilizing":[14],"the":[15,42,58,147,170,183],"capabilities":[16],"and":[17,50,74,98,122,176,179],"responsibilities":[18],"of":[19,44,78,88,104,124,169,186],"LLMs":[20,79,105,125],"for":[21,106,126,157],"automated":[22,45,112,142],"evaluation":[23,107,127],"(LLM4Eval)":[24],"has":[25],"recently":[26],"attracted":[27],"considerable":[28],"attention":[29],"multiple":[31],"research":[32,68],"communities.":[33],"For":[34],"instance,":[35],"LLM4Eval":[36,83,89],"been":[39],"studied":[40],"context":[43],"judgments,":[46,113],"natural":[47],"generation,":[49],"retrieval":[51,60],"augmented":[52],"generation":[53,115],"systems.":[54],"We":[55,136],"believe":[56],"that":[57],"information":[59,109],"community":[61],"can":[62],"significantly":[63],"contribute":[64],"to":[65,82,92,100,130,139,146,154,181],"this":[66],"growing":[67],"area":[69],"by":[70],"designing,":[71],"implementing,":[72],"analyzing,":[73],"evaluating":[75],"various":[76,102],"aspects":[77,103],"with":[80,164],"applications":[81],"tasks.":[84],"The":[85,167],"main":[86],"goal":[87],"workshop":[90,171],"is":[91,172],"bring":[93],"together":[94],"researchers":[95],"from":[96],"industry":[97],"academia":[99],"discuss":[101],"retrieval,":[110],"including":[111,174],"retrieval-augmented":[114],"pipeline":[116],"evaluation,":[117,120],"altering":[118],"human":[119,165],"robustness,":[121],"trustworthiness":[123],"addition":[129],"their":[131],"impact":[132],"on":[133],"real-world":[134],"applications.":[135],"also":[137],"plan":[138],"run":[140],"an":[141],"judgment":[143],"challenge":[144],"prior":[145],"workshop,":[148],"where":[149],"participants":[150],"will":[151],"be":[152],"asked":[153],"generate":[155],"labels":[156],"a":[158,187],"given":[159],"dataset":[160],"while":[161],"maximising":[162],"correlation":[163],"judgments.":[166],"format":[168],"interactive,":[173],"roundtable":[175],"keynote":[177],"sessions":[178],"tends":[180],"avoid":[182],"one-sided":[184],"dialogue":[185],"mini-conference.":[188]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":15},{"year":2024,"cited_by_count":2}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
