{"id":"https://openalex.org/W7134043144","doi":"https://doi.org/10.48550/arxiv.2603.04751","title":"Evaluating the Search Agent in a Parallel World","display_name":"Evaluating the Search Agent in a Parallel World","publication_year":2026,"publication_date":"2026-03-05","ids":{"openalex":"https://openalex.org/W7134043144","doi":"https://doi.org/10.48550/arxiv.2603.04751"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2603.04751","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128266208","display_name":"Jiawei Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chen, Jiawei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128263535","display_name":"Xintian Shen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Xintian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128238171","display_name":"Lihao Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Lihao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128228005","display_name":"Lifu Mu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mu, Lifu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128227538","display_name":"Haoyi Sun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Haoyi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012881558","display_name":"Ning Mao","orcid":"https://orcid.org/0000-0001-7514-252X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mao, Ning","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128276476","display_name":"Hao Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Hao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062578450","display_name":"Tao Wei","orcid":"https://orcid.org/0000-0002-4765-1826"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei, Tao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128255696","display_name":"Pan Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Pan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128269865","display_name":"Kun Zhan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhan, Kun","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5128266208"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.7867000102996826,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.7867000102996826,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.0544000007212162,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13274","display_name":"Expert finding and Q&A systems","score":0.04520000144839287,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ambiguity","display_name":"Ambiguity","score":0.7116000056266785},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5843999981880188},{"id":"https://openalex.org/keywords/situated","display_name":"Situated","score":0.5317999720573425},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5297999978065491},{"id":"https://openalex.org/keywords/semantic-search","display_name":"Semantic search","score":0.5109000205993652},{"id":"https://openalex.org/keywords/search-engine","display_name":"Search engine","score":0.48339998722076416},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.4796999990940094},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.4250999987125397},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.40860000252723694}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7896000146865845},{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.7116000056266785},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5843999981880188},{"id":"https://openalex.org/C132829578","wikidata":"https://www.wikidata.org/wiki/Q581151","display_name":"Situated","level":2,"score":0.5317999720573425},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5297999978065491},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5210999846458435},{"id":"https://openalex.org/C166423231","wikidata":"https://www.wikidata.org/wiki/Q1891170","display_name":"Semantic search","level":3,"score":0.5109000205993652},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.48339998722076416},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.4796999990940094},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43479999899864197},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.4250999987125397},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.40860000252723694},{"id":"https://openalex.org/C13687954","wikidata":"https://www.wikidata.org/wiki/Q4826847","display_name":"Autonomous agent","level":2,"score":0.4043000042438507},{"id":"https://openalex.org/C173979980","wikidata":"https://www.wikidata.org/wiki/Q114106","display_name":"Metasearch engine","level":4,"score":0.39959999918937683},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.3977000117301941},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.39719998836517334},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.38600000739097595},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.3517000079154968},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.3504999876022339},{"id":"https://openalex.org/C37202355","wikidata":"https://www.wikidata.org/wiki/Q7188071","display_name":"Phrase search","level":5,"score":0.34139999747276306},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.3174000084400177},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.30640000104904175},{"id":"https://openalex.org/C117251300","wikidata":"https://www.wikidata.org/wiki/Q1849855","display_name":"Parametric statistics","level":2,"score":0.303600013256073},{"id":"https://openalex.org/C125583679","wikidata":"https://www.wikidata.org/wiki/Q755673","display_name":"Search algorithm","level":2,"score":0.29589998722076416},{"id":"https://openalex.org/C171089853","wikidata":"https://www.wikidata.org/wiki/Q7094123","display_name":"Online search","level":2,"score":0.27720001339912415},{"id":"https://openalex.org/C201789804","wikidata":"https://www.wikidata.org/wiki/Q2362762","display_name":"Search problem","level":2,"score":0.272599995136261},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.2694000005722046},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.2621999979019165},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.25209999084472656},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.2515999972820282}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2603.04751","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2603.04751","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.04751","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2603.04751","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"score":0.6874374151229858,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Integrating":[0],"web":[1],"search":[2,30,98,107,214,237],"tools":[3],"has":[4],"significantly":[5],"extended":[6],"the":[7,146,176],"capability":[8],"of":[9,158,172],"LLMs":[10],"to":[11,66,75,138],"address":[12,115],"open-world,":[13],"real-time,":[14],"and":[15,69,99,142,162,233,246],"long-tail":[16],"problems.":[17],"However,":[18],"evaluating":[19,125],"these":[20,116,190],"Search":[21,126],"Agents":[22,127],"presents":[23],"formidable":[24],"challenges.":[25],"First,":[26],"constructing":[27],"high-quality":[28],"deep":[29,57],"benchmarks":[31,46],"is":[32,87,226],"prohibitively":[33],"expensive,":[34],"while":[35,213],"unverified":[36],"synthetic":[37],"data":[38],"often":[39,59,88],"suffers":[40],"from":[41],"unreliable":[42,242],"sources.":[43],"Second,":[44],"static":[45],"face":[47],"dynamic":[48],"obsolescence:":[49],"as":[50,83],"internet":[51],"information":[52],"evolves,":[53],"complex":[54],"queries":[55],"requiring":[56],"research":[58],"degrade":[60],"into":[61],"simple":[62],"retrieval":[63],"tasks":[64],"due":[65,74],"increased":[67],"popularity,":[68],"ground":[70],"truths":[71],"become":[72],"outdated":[73],"temporal":[76],"shifts.":[77],"Third,":[78],"attribution":[79],"ambiguity":[80],"confounds":[81],"evaluation,":[82,170],"an":[84,197],"agent's":[85],"performance":[86,225],"dominated":[89],"by":[90,230,241],"its":[91,96],"parametric":[92],"memory":[93],"rather":[94],"than":[95],"actual":[97],"reasoning":[100],"capabilities.":[101],"Finally,":[102],"reliance":[103],"on":[104],"specific":[105],"commercial":[106],"engines":[108],"introduces":[109],"variability":[110],"that":[111,184],"hampers":[112],"reproducibility.":[113],"To":[114],"issues,":[117],"we":[118],"propose":[119],"a":[120,129,156,163,180],"novel":[121],"framework,":[122],"Mind-ParaWorld,":[123],"for":[124,166],"in":[128,189,235],"Parallel":[130],"World.":[131],"Specifically,":[132],"MPW":[133],"samples":[134],"real-world":[135,174],"entity":[136],"names":[137],"synthesize":[139],"future":[140],"scenarios":[141],"questions":[143],"situated":[144],"beyond":[145],"model's":[147],"knowledge":[148],"cutoff.":[149],"A":[150],"ParaWorld":[151,181],"Law":[152],"Model":[153,183],"then":[154],"constructs":[155],"set":[157],"indivisible":[159],"Atomic":[160,192],"Facts":[161],"unique":[164],"ground-truth":[165],"each":[167],"question.":[168],"During":[169],"instead":[171],"retrieving":[173],"results,":[175],"agent":[177],"interacts":[178],"with":[179,203],"Engine":[182],"dynamically":[185],"generates":[186],"SERPs":[187],"grounded":[188],"inviolable":[191],"Facts.":[193],"We":[194],"release":[195],"MPW-Bench,":[196],"interactive":[198],"benchmark":[199],"spanning":[200],"19":[201],"domains":[202],"1,608":[204],"instances.":[205],"Experiments":[206],"across":[207],"three":[208],"evaluation":[209],"settings":[210],"show":[211],"that,":[212],"agents":[215],"are":[216],"strong":[217],"at":[218],"evidence":[219,231,243],"synthesis":[220],"given":[221],"complete":[222],"information,":[223],"their":[224],"limited":[227],"not":[228],"only":[229],"collection":[232],"coverage":[234],"unfamiliar":[236],"environments,":[238],"but":[239],"also":[240],"sufficiency":[244],"judgment":[245],"when-to-stop":[247],"decisions-bottlenecks.":[248]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-03-07T00:00:00"}
