{"id":"https://openalex.org/W7151627296","doi":"https://doi.org/10.48550/arxiv.2604.04651","title":"Search, Do not Guess: Teaching Small Language Models to Be Effective Search Agents","display_name":"Search, Do not Guess: Teaching Small Language Models to Be Effective Search Agents","publication_year":2026,"publication_date":"2026-04-06","ids":{"openalex":"https://openalex.org/W7151627296","doi":"https://doi.org/10.48550/arxiv.2604.04651"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.04651","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.04651","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.04651","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133124376","display_name":"Yizhou Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Yizhou","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133122697","display_name":"Qi Sun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Qi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133144002","display_name":"Yulin Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yulin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133065664","display_name":"Siyue Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Siyue","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133105642","display_name":"Chen Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Chen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3549000024795532,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3549000024795532,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.1315000057220459,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13274","display_name":"Expert finding and Q&A systems","score":0.06859999895095825,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4487999975681305},{"id":"https://openalex.org/keywords/parametric-statistics","display_name":"Parametric statistics","score":0.40700000524520874},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.3937000036239624},{"id":"https://openalex.org/keywords/spurious-relationship","display_name":"Spurious relationship","score":0.3659999966621399},{"id":"https://openalex.org/keywords/work","display_name":"Work (physics)","score":0.3418000042438507},{"id":"https://openalex.org/keywords/soundness","display_name":"Soundness","score":0.3224000036716461}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7297000288963318},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4575999975204468},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4487999975681305},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41179999709129333},{"id":"https://openalex.org/C117251300","wikidata":"https://www.wikidata.org/wiki/Q1849855","display_name":"Parametric statistics","level":2,"score":0.40700000524520874},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.3937000036239624},{"id":"https://openalex.org/C97256817","wikidata":"https://www.wikidata.org/wiki/Q1462316","display_name":"Spurious relationship","level":2,"score":0.3659999966621399},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.3418000042438507},{"id":"https://openalex.org/C39920170","wikidata":"https://www.wikidata.org/wiki/Q693083","display_name":"Soundness","level":2,"score":0.3224000036716461},{"id":"https://openalex.org/C190839683","wikidata":"https://www.wikidata.org/wiki/Q2448197","display_name":"Train","level":2,"score":0.31209999322891235},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.287200003862381},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.28040000796318054},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.25609999895095825},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.25049999356269836}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.04651","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.04651","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.04651","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.04651","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Agents":[0],"equipped":[1],"with":[2],"search":[3,30,66,132,144],"tools":[4,67],"have":[5],"emerged":[6],"as":[7],"effective":[8],"solutions":[9],"for":[10,29,146],"knowledge-intensive":[11],"tasks.":[12],"While":[13],"Large":[14],"Language":[15,45],"Models":[16,46],"(LLMs)":[17],"exhibit":[18],"strong":[19],"reasoning":[20,54],"capabilities,":[21],"their":[22],"high":[23],"computational":[24],"cost":[25],"limits":[26],"practical":[27],"deployment":[28],"agents.":[31],"Consequently,":[32],"recent":[33],"work":[34],"has":[35],"focused":[36],"on":[37,51,114,119],"distilling":[38],"agentic":[39],"behaviors":[40],"from":[41,105],"LLMs":[42],"into":[43],"Small":[44],"(SLMs).":[47],"Through":[48],"comprehensive":[49],"evaluation":[50],"complex":[52],"multi-hop":[53],"tasks,":[55],"we":[56,80],"find":[57],"that":[58,87,130],"despite":[59],"possessing":[60],"less":[61,68],"parametric":[62],"knowledge,":[63],"SLMs":[64,90,135],"invoke":[65],"frequently":[69],"and":[70,94,116],"are":[71],"more":[72],"prone":[73],"to":[74,91,102],"hallucinations.":[75],"To":[76],"address":[77],"this":[78],"issue,":[79],"propose":[81],"\\policy,":[82],"a":[83],"lightweight":[84],"fine-tuning":[85],"approach":[86,108],"explicitly":[88],"trains":[89],"reliably":[92],"retrieve":[93],"generate":[95],"answers":[96],"grounded":[97],"in":[98,134],"retrieved":[99],"evidence.":[100],"Compared":[101],"agent":[103],"distillation":[104],"LLMs,":[106],"our":[107],"improves":[109],"performance":[110],"by":[111],"17.3":[112],"scores":[113,118],"Bamboogle":[115],"15.3":[117],"HotpotQA,":[120],"achieving":[121],"LLM-level":[122],"results":[123],"across":[124],"benchmarks.":[125],"Our":[126],"further":[127],"analysis":[128],"reveals":[129],"adaptive":[131],"strategies":[133],"often":[136],"degrade":[137],"performance,":[138],"highlighting":[139],"the":[140],"necessity":[141],"of":[142],"consistent":[143],"behavior":[145],"reliable":[147],"reasoning.":[148]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-08T00:00:00"}
