{"id":"https://openalex.org/W4414359293","doi":"https://doi.org/10.24963/ijcai.2025/1153","title":"Paradigms of AI Evaluation: Mapping Goals, Methodologies and Culture","display_name":"Paradigms of AI Evaluation: Mapping Goals, Methodologies and Culture","publication_year":2025,"publication_date":"2025-09-01","ids":{"openalex":"https://openalex.org/W4414359293","doi":"https://doi.org/10.24963/ijcai.2025/1153"},"language":"en","primary_location":{"id":"doi:10.24963/ijcai.2025/1153","is_oa":false,"landing_page_url":"https://doi.org/10.24963/ijcai.2025/1153","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Thirty-Fourth International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5044048765","display_name":"John Burden","orcid":"https://orcid.org/0000-0001-7526-0753"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]},{"id":"https://openalex.org/I2802641067","display_name":"Leverhulme Trust","ror":"https://ror.org/012mzw131","country_code":"GB","type":"nonprofit","lineage":["https://openalex.org/I2802641067"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"John Burden","raw_affiliation_strings":["Leverhulme Centre for the Future of Intelligence, University of Cambridge"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Leverhulme Centre for the Future of Intelligence, University of Cambridge","institution_ids":["https://openalex.org/I2802641067","https://openalex.org/I241749"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011322547","display_name":"Marko Te\u0161i\u0107","orcid":"https://orcid.org/0000-0003-3368-7024"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]},{"id":"https://openalex.org/I2802641067","display_name":"Leverhulme Trust","ror":"https://ror.org/012mzw131","country_code":"GB","type":"nonprofit","lineage":["https://openalex.org/I2802641067"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Marko Te\u0161i\u0107","raw_affiliation_strings":["Leverhulme Centre for the Future of Intelligence, University of Cambridge"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Leverhulme Centre for the Future of Intelligence, University of Cambridge","institution_ids":["https://openalex.org/I2802641067","https://openalex.org/I241749"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018689327","display_name":"Lorenzo Pacchiardi","orcid":"https://orcid.org/0000-0003-4760-7638"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]},{"id":"https://openalex.org/I2802641067","display_name":"Leverhulme Trust","ror":"https://ror.org/012mzw131","country_code":"GB","type":"nonprofit","lineage":["https://openalex.org/I2802641067"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Lorenzo Pacchiardi","raw_affiliation_strings":["Leverhulme Centre for the Future of Intelligence, University of Cambridge"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Leverhulme Centre for the Future of Intelligence, University of Cambridge","institution_ids":["https://openalex.org/I2802641067","https://openalex.org/I241749"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5029864546","display_name":"Jos\u00e9 Hern\u00e1ndez\u2010Orallo","orcid":"https://orcid.org/0000-0001-9746-7632"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]},{"id":"https://openalex.org/I2802641067","display_name":"Leverhulme Trust","ror":"https://ror.org/012mzw131","country_code":"GB","type":"nonprofit","lineage":["https://openalex.org/I2802641067"]},{"id":"https://openalex.org/I60053951","display_name":"Universitat Polit\u00e8cnica de Val\u00e8ncia","ror":"https://ror.org/01460j859","country_code":"ES","type":"education","lineage":["https://openalex.org/I60053951"]}],"countries":["ES","GB"],"is_corresponding":false,"raw_author_name":"Jos\u00e9 Hern\u00e1ndez-Orallo","raw_affiliation_strings":["Leverhulme Centre for the Future of Intelligence, University of Cambridge","Universitat Polit\u00e8cnica de Val\u00e8ncia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Leverhulme Centre for the Future of Intelligence, University of Cambridge","institution_ids":["https://openalex.org/I2802641067","https://openalex.org/I241749"]},{"raw_affiliation_string":"Universitat Polit\u00e8cnica de Val\u00e8ncia","institution_ids":["https://openalex.org/I60053951"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":5.1936,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.95501767,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"10381","last_page":"10390"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12805","display_name":"Cognitive Science and Mapping","score":0.3434999883174896,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12805","display_name":"Cognitive Science and Mapping","score":0.3434999883174896,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bridge","display_name":"Bridge (graph theory)","score":0.6118999719619751},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.5012000203132629},{"id":"https://openalex.org/keywords/fragmentation","display_name":"Fragmentation (computing)","score":0.43549999594688416},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4251999855041504}],"concepts":[{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.6118999719619751},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.5367000102996826},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.5012000203132629},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.45579999685287476},{"id":"https://openalex.org/C191015642","wikidata":"https://www.wikidata.org/wiki/Q1132459","display_name":"Fragmentation (computing)","level":2,"score":0.43549999594688416},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4251999855041504},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.37459999322891235},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.34299999475479126},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.32019999623298645},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.3111000061035156},{"id":"https://openalex.org/C55587333","wikidata":"https://www.wikidata.org/wiki/Q1133029","display_name":"Engineering ethics","level":1,"score":0.29019999504089355},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.26100000739097595},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.25540000200271606},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.2540999948978424}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.24963/ijcai.2025/1153","is_oa":false,"landing_page_url":"https://doi.org/10.24963/ijcai.2025/1153","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Thirty-Fourth International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Research":[0],"in":[1,27,70,77,142],"AI":[2,63,79],"evaluation":[3,21,80,129],"has":[4,39],"grown":[5],"increasingly":[6],"complex":[7],"and":[8,15,32,45,52,82,103,113,131],"multidisciplinary,":[9],"attracting":[10],"researchers":[11],"with":[12,53,116],"diverse":[13],"backgrounds":[14],"objectives.":[16],"As":[17],"a":[18],"result,":[19],"divergent":[20],"paradigms":[22,51],"have":[23],"emerged,":[24],"often":[25],"developing":[26],"isolation,":[28],"adopting":[29],"conflicting":[30],"terminologies,":[31],"overlooking":[33],"each":[34,93,117],"other's":[35],"contributions.":[36],"This":[37],"fragmentation":[38],"led":[40],"to":[41,58,99,121,145],"insular":[42],"research":[43,104,148],"trajectories":[44],"communication":[46],"barriers":[47],"both":[48],"among":[49],"different":[50,135],"the":[54,78,108,125,143],"general":[55],"public,":[56],"contributing":[57],"unmet":[59],"expectations":[60],"for":[61],"deployed":[62],"systems.":[64],"To":[65],"help":[66],"bridge":[67],"this":[68,71],"insularity,":[69],"paper":[72],"we":[73,119],"survey":[74],"recent":[75,90],"work":[76],"landscape":[81],"identify":[83,139],"six":[84],"main":[85],"paradigms.":[86,136],"We":[87,137],"characterise":[88],"major":[89],"contributions":[91],"within":[92],"paradigm":[94],"across":[95],"key":[96],"dimensions":[97],"related":[98],"their":[100],"goals,":[101],"methodologies":[102],"cultures.":[105],"By":[106],"clarifying":[107],"unique":[109],"combination":[110],"of":[111,124,127],"questions":[112],"approaches":[114,130],"associated":[115],"paradigm,":[118],"aim":[120],"increase":[122],"awareness":[123],"breadth":[126],"current":[128],"foster":[132],"cross-pollination":[133],"between":[134],"also":[138],"potential":[140],"gaps":[141],"field":[144],"inspire":[146],"future":[147],"directions.":[149]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":1}],"updated_date":"2026-06-14T07:44:22.658603","created_date":"2025-10-10T00:00:00"}
