{"id":"https://openalex.org/W7162459613","doi":"https://doi.org/10.48550/arxiv.2605.26086","title":"Claw-Anything: Benchmarking Always-On Personal Assistants with Broader Access to User's Digital World","display_name":"Claw-Anything: Benchmarking Always-On Personal Assistants with Broader Access to User's Digital World","publication_year":2026,"publication_date":"2026-05-25","ids":{"openalex":"https://openalex.org/W7162459613","doi":"https://doi.org/10.48550/arxiv.2605.26086"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.26086","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.26086","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.26086","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137025714","display_name":"Yusong Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Yusong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137057483","display_name":"Xinyuan Liang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liang, Xinyuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137031333","display_name":"Haiyang Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Haiyang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017003276","display_name":"Qipeng Gu","orcid":"https://orcid.org/0000-0002-3151-6486"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gu, Qipeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120717258","display_name":"Siqi Cheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cheng, Siqi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137045318","display_name":"Jiangui Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Jiangui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137023349","display_name":"Shuzhe Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Shuzhe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137074428","display_name":"Feiyang Pan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pan, Feiyang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064754069","display_name":"Lue Fan","orcid":"https://orcid.org/0000-0002-2349-0538"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fan, Lue","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137008238","display_name":"Sanyuan Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Sanyuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5137030937","display_name":"Dandan Tu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tu, Dandan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.13740000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.13740000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.12880000472068787,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12128","display_name":"AI in Service Interactions","score":0.09390000253915787,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.7741000056266785},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5914000272750854},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5625},{"id":"https://openalex.org/keywords/scope","display_name":"Scope (computer science)","score":0.5368000268936157},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5263000130653381},{"id":"https://openalex.org/keywords/interdependence","display_name":"Interdependence","score":0.5206999778747559},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5099999904632568},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.487199991941452}],"concepts":[{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.7741000056266785},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6710000038146973},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5914000272750854},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5625},{"id":"https://openalex.org/C2778012447","wikidata":"https://www.wikidata.org/wiki/Q1034415","display_name":"Scope (computer science)","level":2,"score":0.5368000268936157},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5263000130653381},{"id":"https://openalex.org/C185874996","wikidata":"https://www.wikidata.org/wiki/Q269699","display_name":"Interdependence","level":2,"score":0.5206999778747559},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5099999904632568},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.487199991941452},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.43050000071525574},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.39239999651908875},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.3855000138282776},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.3596999943256378},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.32760000228881836},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.3246999979019165},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.29739999771118164},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.28790000081062317},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.27950000762939453},{"id":"https://openalex.org/C114073186","wikidata":"https://www.wikidata.org/wiki/Q2631895","display_name":"Automated planning and scheduling","level":2,"score":0.27810001373291016},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.2603999972343445},{"id":"https://openalex.org/C170130773","wikidata":"https://www.wikidata.org/wiki/Q216378","display_name":"Usability","level":2,"score":0.25380000472068787},{"id":"https://openalex.org/C89505385","wikidata":"https://www.wikidata.org/wiki/Q47146","display_name":"User interface","level":2,"score":0.250900000333786}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.26086","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.26086","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.26086","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.26086","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[{"score":0.6356675028800964,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"model":[2,193],"agents":[3,140],"are":[4],"increasingly":[5],"envisioned":[6],"as":[7],"always-on":[8,56,172],"personal":[9,173],"assistants":[10],"with":[11],"access":[12],"to":[13,49,126,141],"anything":[14],"relevant":[15],"in":[16,52],"the":[17,134,169,176,191],"user's":[18],"digital":[19],"world.":[20],"Yet":[21],"current":[22,165],"systems":[23],"operate":[24],"over":[25,119],"only":[26,42,154],"narrow":[27],"slices":[28],"of":[29,96,136,171,199],"that":[30,67,151,184],"world,":[31],"limiting":[32],"context-sensitive":[33],"reasoning":[34],"and":[35,46,80,83,107,113,145,168,189],"effective":[36],"assistance.":[37,174],"Existing":[38],"benchmarks":[39],"similarly":[40],"provide":[41],"partial":[43],"user":[44,97,143],"state":[45],"therefore":[47],"fail":[48],"capture":[50],"performance":[51],"such":[53,127],"a":[54,65,162],"broad,":[55],"setting.":[57],"To":[58,89],"address":[59],"this":[60,91],"gap,":[61],"we":[62,93,178],"introduce":[63],"Claw-Anything,":[64],"benchmark":[66],"expands":[68],"agent":[69,166],"context":[70],"along":[71],"three":[72],"dimensions:":[73],"long-horizon":[74],"activity":[75,98],"histories,":[76],"interdependent":[77],"backend":[78],"services,":[79],"integrated":[81],"GUI":[82],"CLI":[84],"interaction":[85],"across":[86],"multiple":[87],"devices.":[88],"instantiate":[90],"setting,":[92],"simulate":[94],"months":[95],"through":[99],"multi-round":[100],"event":[101],"injection,":[102],"producing":[103],"complex":[104],"world":[105],"states":[106],"realistic":[108],"noise,":[109],"including":[110],"irrelevant":[111],"events":[112],"conflicting":[114],"signals.":[115],"Agents":[116],"must":[117],"reason":[118],"rich":[120],"contextual":[121],"environments":[122,188],"while":[123],"remaining":[124],"robust":[125],"noise.":[128],"This":[129],"expanded":[130],"scope":[131],"also":[132],"enables":[133],"evaluation":[135],"proactive":[137],"assistance,":[138],"requiring":[139],"anticipate":[142],"needs":[144],"deliver":[146],"timely":[147],"recommendations.":[148],"Experiments":[149],"show":[150],"GPT-5.5":[152],"achieves":[153],"34.5%":[155],"pass@1,":[156],"substantially":[157],"below":[158],"prior":[159],"benchmarks,":[160],"underscoring":[161],"gap":[163],"between":[164],"capabilities":[167],"demands":[170],"Alongside":[175],"benchmark,":[177],"release":[179],"an":[180],"automated":[181],"data-generation":[182],"pipeline":[183],"yields":[185],"2,000":[186],"training":[187],"improves":[190],"base":[192],"by":[194],"23.7%,":[195],"demonstrating":[196],"its":[197],"utility":[198],"scalable":[200],"data":[201],"infrastructure.":[202]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-05-27T00:00:00"}
