{"id":"https://openalex.org/W7131859348","doi":"https://doi.org/10.48550/arxiv.2602.22638","title":"MobilityBench: A Benchmark for Evaluating Route-Planning Agents in Real-World Mobility Scenarios","display_name":"MobilityBench: A Benchmark for Evaluating Route-Planning Agents in Real-World Mobility Scenarios","publication_year":2026,"publication_date":"2026-02-26","ids":{"openalex":"https://openalex.org/W7131859348","doi":"https://doi.org/10.48550/arxiv.2602.22638"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.22638","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5127271734","display_name":"Zhiheng Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Song, Zhiheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127262803","display_name":"Jingshuai Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Jingshuai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102883290","display_name":"Chuan Qin","orcid":"https://orcid.org/0000-0002-5354-8630"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qin, Chuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127460134","display_name":"Chao Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Chao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127242019","display_name":"Chao Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Chao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125905324","display_name":"Longfei Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Longfei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127180355","display_name":"Kaikui Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Kaikui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127264428","display_name":"Xiangxiang Chu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chu, Xiangxiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5121755810","display_name":"Hengshu Zhu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhu, Hengshu","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5127271734"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11942","display_name":"Transportation and Mobility Innovations","score":0.25099998712539673,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11942","display_name":"Transportation and Mobility Innovations","score":0.25099998712539673,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11980","display_name":"Human Mobility and Location-Based Analysis","score":0.22910000383853912,"subfield":{"id":"https://openalex.org/subfields/3313","display_name":"Transportation"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.09359999746084213,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.8348000049591064},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6909999847412109},{"id":"https://openalex.org/keywords/protocol","display_name":"Protocol (science)","score":0.5320000052452087},{"id":"https://openalex.org/keywords/documentation","display_name":"Documentation","score":0.5281000137329102},{"id":"https://openalex.org/keywords/sandbox","display_name":"Sandbox (software development)","score":0.4970000088214874},{"id":"https://openalex.org/keywords/routing","display_name":"Routing (electronic design automation)","score":0.4846000075340271},{"id":"https://openalex.org/keywords/variance","display_name":"Variance (accounting)","score":0.36959999799728394}],"concepts":[{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.8348000049591064},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7379999756813049},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6909999847412109},{"id":"https://openalex.org/C2780385302","wikidata":"https://www.wikidata.org/wiki/Q367158","display_name":"Protocol (science)","level":3,"score":0.5320000052452087},{"id":"https://openalex.org/C56666940","wikidata":"https://www.wikidata.org/wiki/Q788790","display_name":"Documentation","level":2,"score":0.5281000137329102},{"id":"https://openalex.org/C167981075","wikidata":"https://www.wikidata.org/wiki/Q2667186","display_name":"Sandbox (software development)","level":2,"score":0.4970000088214874},{"id":"https://openalex.org/C74172769","wikidata":"https://www.wikidata.org/wiki/Q1446839","display_name":"Routing (electronic design automation)","level":2,"score":0.4846000075340271},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.39590001106262207},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.36959999799728394},{"id":"https://openalex.org/C148220186","wikidata":"https://www.wikidata.org/wiki/Q7111912","display_name":"Outcome (game theory)","level":2,"score":0.3513000011444092},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.33169999718666077},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3278999924659729},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.326200008392334},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.3140000104904175},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.31349998712539673},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3012000024318695},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2750999927520752},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.2621000111103058},{"id":"https://openalex.org/C2778068325","wikidata":"https://www.wikidata.org/wiki/Q19892785","display_name":"Individual mobility","level":2,"score":0.25999999046325684},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.2540999948978424}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.22638","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.22638","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.22638","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.22638","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Route-planning":[0],"agents":[1,59,135],"powered":[2],"by":[3,36,118],"large":[4],"language":[5,21],"models":[6,156],"(LLMs)":[7],"have":[8],"emerged":[9],"as":[10],"a":[11,52,78,95,109],"promising":[12],"paradigm":[13],"for":[14,55,177],"supporting":[15],"everyday":[16],"human":[17],"mobility":[18,32,62,139,181],"through":[19],"natural":[20],"interaction":[22],"and":[23,43,76,126,141,149,163,191],"tool-mediated":[24],"decision":[25],"making.":[26],"However,":[27],"systematic":[28],"evaluation":[29,111,189],"in":[30,60,179],"real-world":[31,61,138],"settings":[33],"is":[34,65],"hindered":[35],"diverse":[37,137],"routing":[38],"demands,":[39],"non-deterministic":[40],"mapping":[41],"services,":[42],"limited":[44],"reproducibility.":[45],"In":[46],"this":[47],"study,":[48],"we":[49,93,130],"introduce":[50],"MobilityBench,":[51,129],"scalable":[53],"benchmark":[54,187],"evaluating":[56],"LLM-based":[57,133],"route-planning":[58,82,134],"scenarios.":[63],"MobilityBench":[64],"constructed":[66],"from":[67,74,103],"large-scale,":[68],"anonymized":[69],"real":[70],"user":[71],"queries":[72],"collected":[73],"Amap":[75],"covers":[77],"broad":[79],"spectrum":[80],"of":[81,120,146],"intents":[83],"across":[84,136],"multiple":[85,132],"cities":[86],"worldwide.":[87],"To":[88],"enable":[89],"reproducible,":[90],"end-to-end":[91],"evaluation,":[92],"design":[94],"deterministic":[96],"API-replay":[97],"sandbox":[98],"that":[99,154],"eliminates":[100],"environmental":[101],"variance":[102],"live":[104],"services.":[105],"We":[106,183],"further":[107],"propose":[108],"multi-dimensional":[110],"protocol":[112],"centered":[113],"on":[114,159],"outcome":[115],"validity,":[116],"complemented":[117],"assessments":[119],"instruction":[121],"understanding,":[122],"planning,":[123],"tool":[124],"use,":[125],"efficiency.":[127],"Using":[128],"evaluate":[131],"scenarios":[140],"provide":[142],"an":[143],"in-depth":[144],"analysis":[145],"their":[147],"behaviors":[148],"performance.":[150],"Our":[151],"findings":[152],"reveal":[153],"current":[155],"perform":[157],"competently":[158],"Basic":[160],"information":[161],"retrieval":[162],"Route":[164,172],"Planning":[165],"tasks,":[166],"yet":[167],"struggle":[168],"considerably":[169],"with":[170],"Preference-Constrained":[171],"Planning,":[173],"underscoring":[174],"significant":[175],"room":[176],"improvement":[178],"personalized":[180],"applications.":[182],"publicly":[184],"release":[185],"the":[186],"data,":[188],"toolkit,":[190],"documentation":[192],"at":[193],"https://github.com/AMAP-ML/MobilityBench":[194],".":[195]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-28T00:00:00"}
