{"id":"https://openalex.org/W4392126166","doi":"https://doi.org/10.48550/arxiv.2402.14005","title":"Relying on the Metrics of Evaluated Agents","display_name":"Relying on the Metrics of Evaluated Agents","publication_year":2024,"publication_date":"2024-02-21","ids":{"openalex":"https://openalex.org/W4392126166","doi":"https://doi.org/10.48550/arxiv.2402.14005"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2402.14005","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.14005","pdf_url":"https://arxiv.org/pdf/2402.14005","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2402.14005","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5047154233","display_name":"Serena Wang","orcid":"https://orcid.org/0000-0002-5532-071X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wang, Serena","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049812527","display_name":"Michael I. Jordan","orcid":"https://orcid.org/0000-0001-8935-817X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jordan, Michael I.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076701535","display_name":"Katrina Ligett","orcid":"https://orcid.org/0000-0003-2780-6656"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ligett, Katrina","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5089940510","display_name":"R. Preston McAfee","orcid":"https://orcid.org/0000-0002-2587-3161"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"McAfee, R. Preston","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5047154233"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.4894999861717224,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.4894999861717224,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/agency","display_name":"Agency (philosophy)","score":0.733302652835846},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.33393263816833496},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.33178606629371643},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.3246335983276367},{"id":"https://openalex.org/keywords/sociology","display_name":"Sociology","score":0.16702845692634583},{"id":"https://openalex.org/keywords/social-science","display_name":"Social science","score":0.06548982858657837}],"concepts":[{"id":"https://openalex.org/C108170787","wikidata":"https://www.wikidata.org/wiki/Q3951828","display_name":"Agency (philosophy)","level":2,"score":0.733302652835846},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.33393263816833496},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.33178606629371643},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3246335983276367},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.16702845692634583},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.06548982858657837}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2402.14005","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.14005","pdf_url":"https://arxiv.org/pdf/2402.14005","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2402.14005","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2402.14005","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2402.14005","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.14005","pdf_url":"https://arxiv.org/pdf/2402.14005","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4392126166.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W2478288626","https://openalex.org/W4391913857","https://openalex.org/W2350741829","https://openalex.org/W2530322880"],"abstract_inverted_index":{"Online":[0],"platforms":[1],"and":[2,17,120,146,164],"regulators":[3],"face":[4,49],"a":[5,96,137],"continuing":[6],"problem":[7,28],"of":[8,29,38,45,50,95],"designing":[9],"effective":[10],"evaluation":[11],"metrics.":[12],"While":[13],"tools":[14],"for":[15,160],"collecting":[16],"processing":[18],"data":[19,171],"continue":[20],"to":[21,56,68,91,98,108,135,154],"progress,":[22],"this":[23,51,75],"has":[24],"not":[25],"addressed":[26],"the":[27,39,43,48,57,93,113,118,125,131,162],"\"unknown":[30],"unknowns\",":[31],"or":[32],"fundamental":[33],"informational":[34,52],"limitations":[35],"on":[36,170],"part":[37],"evaluator.":[40,165],"To":[41],"guide":[42],"choice":[44],"metrics":[46,110,122],"in":[47],"problem,":[53],"we":[54,82],"turn":[55],"evaluated":[58],"agents":[59],"themselves,":[60],"who":[61],"may":[62],"have":[63,88],"more":[64],"information":[65],"about":[66],"how":[67],"measure":[69],"their":[70,99],"own":[71],"outcomes.":[72],"We":[73,101,127,166],"model":[74],"interaction":[76],"as":[77],"an":[78,86,89,104,151],"agency":[79],"game,":[80],"where":[81],"ask:":[83],"\"When":[84],"does":[85],"agent":[87,105,132,163],"incentive":[90],"reveal":[92,109,136],"observability":[94],"metric":[97,138],"evaluator?\"":[100],"show":[102,129],"that":[103,111,123,130,156],"will":[106],"prefer":[107,134],"differentiate":[112,124],"most":[114],"difficult":[115],"tasks":[116],"from":[117,172],"rest,":[119],"conceal":[121],"easiest.":[126],"further":[128],"can":[133],"\"garbled\"":[139],"with":[140],"noise":[141],"over":[142],"both":[143,161],"fully":[144,147],"concealing":[145],"revealing.":[148],"This":[149],"indicates":[150],"economic":[152],"value":[153],"privacy":[155],"yields":[157],"Pareto":[158],"improvement":[159],"demonstrate":[167],"these":[168],"findings":[169],"online":[173],"rideshare":[174],"platforms.":[175]},"counts_by_year":[],"updated_date":"2026-03-14T08:43:22.919905","created_date":"2024-02-24T00:00:00"}
