{"id":"https://openalex.org/W7119012018","doi":"https://doi.org/10.48550/arxiv.2601.02365","title":"FUSE : Failure-aware Usage of Subagent Evidence for MultiModal Search and Recommendation","display_name":"FUSE : Failure-aware Usage of Subagent Evidence for MultiModal Search and Recommendation","publication_year":2025,"publication_date":"2025-11-15","ids":{"openalex":"https://openalex.org/W7119012018","doi":"https://doi.org/10.48550/arxiv.2601.02365"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.02365","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.02365","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.02365","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5115023843","display_name":"Tushar Vatsa","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vatsa, Tushar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069713931","display_name":"Vibha Belavadi","orcid":"https://orcid.org/0000-0002-1244-7702"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Belavadi, Vibha","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5098767992","display_name":"Priya Shanmugasundaram","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shanmugasundaram, Priya","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122212891","display_name":"Suhas Suresha","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Suresha, Suhas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5095886520","display_name":"Dewang Sultania","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sultania, Dewang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.733299970626831,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.733299970626831,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.05490000173449516,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.03889999911189079,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.6640999913215637},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6478000283241272},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.5602999925613403},{"id":"https://openalex.org/keywords/fuse","display_name":"Fuse (electrical)","score":0.48179998993873596},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.46320000290870667},{"id":"https://openalex.org/keywords/automatic-summarization","display_name":"Automatic summarization","score":0.446399986743927},{"id":"https://openalex.org/keywords/planner","display_name":"Planner","score":0.42899999022483826},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.3580999970436096},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.3546999990940094}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7996000051498413},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.6640999913215637},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6478000283241272},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5690000057220459},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.5602999925613403},{"id":"https://openalex.org/C141353440","wikidata":"https://www.wikidata.org/wiki/Q182221","display_name":"Fuse (electrical)","level":2,"score":0.48179998993873596},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.46320000290870667},{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.446399986743927},{"id":"https://openalex.org/C2776999362","wikidata":"https://www.wikidata.org/wiki/Q2349274","display_name":"Planner","level":2,"score":0.42899999022483826},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.40630000829696655},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.40560001134872437},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.3580999970436096},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.3546999990940094},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3257000148296356},{"id":"https://openalex.org/C8797682","wikidata":"https://www.wikidata.org/wiki/Q2115","display_name":"XML","level":2,"score":0.325300008058548},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.3222000002861023},{"id":"https://openalex.org/C89505385","wikidata":"https://www.wikidata.org/wiki/Q47146","display_name":"User interface","level":2,"score":0.3197999894618988},{"id":"https://openalex.org/C25810664","wikidata":"https://www.wikidata.org/wiki/Q44325","display_name":"Ontology","level":2,"score":0.30959999561309814},{"id":"https://openalex.org/C2781368080","wikidata":"https://www.wikidata.org/wiki/Q501688","display_name":"Context awareness","level":3,"score":0.29820001125335693},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.29030001163482666},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2727000117301941},{"id":"https://openalex.org/C201025465","wikidata":"https://www.wikidata.org/wiki/Q11248500","display_name":"User experience design","level":2,"score":0.26809999346733093},{"id":"https://openalex.org/C2780213375","wikidata":"https://www.wikidata.org/wiki/Q16340","display_name":"XPath","level":4,"score":0.2662999927997589},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.263700008392334},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.2624000012874603},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.2615000009536743},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.25929999351501465},{"id":"https://openalex.org/C71901391","wikidata":"https://www.wikidata.org/wiki/Q7126699","display_name":"Upload","level":2,"score":0.2590999901294708},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.2587999999523163},{"id":"https://openalex.org/C157659113","wikidata":"https://www.wikidata.org/wiki/Q533822","display_name":"WordNet","level":2,"score":0.25369998812675476},{"id":"https://openalex.org/C86037889","wikidata":"https://www.wikidata.org/wiki/Q4330127","display_name":"Learning to rank","level":3,"score":0.2533000111579895}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.02365","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.02365","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.02365","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.02365","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Multimodal":[0],"creative":[1],"assistants":[2],"decompose":[3],"user":[4,29,95],"goals":[5],"and":[6,15,42,63,94,121,147,150,168,198,211],"route":[7],"tasks":[8],"to":[9],"subagents":[10],"for":[11,60],"layout,":[12],"styling,":[13],"retrieval,":[14],"generation.":[16],"Retrieval":[17],"quality":[18],"is":[19,45],"pivotal,":[20],"yet":[21],"failures":[22],"can":[23],"arise":[24],"at":[25],"several":[26],"stages:":[27],"understanding":[28],"intent,":[30],"choosing":[31],"content":[32],"types,":[33],"finding":[34],"candidates":[35],"(recall),":[36],"or":[37],"ranking":[38,151],"results.":[39],"Meanwhile,":[40],"sending":[41],"processing":[43],"images":[44],"costly,":[46],"making":[47],"naive":[48],"multimodal":[49],"approaches":[50],"impractical.":[51],"We":[52,154],"present":[53],"FUSE:":[54],"Failure-aware":[55],"Usage":[56],"of":[57,81],"Subagent":[58],"Evidence":[59],"MultiModal":[61],"Search":[62],"Recommendation.":[64],"FUSE":[65,102],"replaces":[66],"most":[67],"raw-image":[68],"prompting":[69],"with":[70,188],"a":[71,77,125],"compact":[72],"Grounded":[73],"Design":[74],"Representation":[75],"(GDR):":[76],"selection":[78,96],"aware":[79],"JSON":[80],"canvas":[82],"elements":[83],"(image,":[84],"text,":[85],"shape,":[86],"icon,":[87],"video,":[88],"logo),":[89],"structure,":[90],"styles,":[91],"salient":[92],"colors,":[93],"provided":[97],"by":[98,132],"the":[99,156],"Planner":[100],"team.":[101],"implements":[103],"seven":[104,157],"context":[105,111,158,206],"budgeting":[106,159],"strategies:":[107],"comprehensive":[108,210],"baseline":[109],"prompting,":[110],"compression,":[112],"chain-of-thought":[113],"reasoning,":[114],"mini-shot":[115],"optimization,":[116],"retrieval-augmented":[117],"context,":[118],"two-stage":[119],"processing,":[120],"zero-shot":[122],"minimalism.":[123],"Finally,":[124],"pipeline":[126,186],"attribution":[127],"layer":[128],"monitors":[129],"system":[130],"performance":[131,183],"converting":[133],"subagent":[134],"signals":[135],"into":[136],"simple":[137],"checks:":[138],"intent":[139,190],"alignment,":[140],"content-type/routing":[141],"sanity,":[142],"recall":[143],"health":[144],"(e.g.,":[145],"zero-hit":[146],"top-match":[148],"strength),":[149],"displacement":[152],"analysis.":[153],"evaluate":[155],"variants":[160],"across":[161,184],"788":[162],"evaluation":[163,176],"queries":[164],"from":[165],"diverse":[166],"users":[167],"design":[169],"templates":[170],"(refer":[171],"Figure":[172],"3).":[173],"Our":[174],"systematic":[175],"reveals":[177],"that":[178,204],"Context":[179],"Compression":[180],"achieves":[181],"optimal":[182],"all":[185],"stages,":[187],"93.3%":[189],"accuracy,":[191],"86.8%":[192],"routing":[193],"success(with":[194],"fallbacks),":[195],"99.4%":[196],"recall,":[197],"88.5%":[199],"NDCG@5.":[200],"This":[201],"approach":[202],"demonstrates":[203],"strategic":[205],"summarization":[207],"outperforms":[208],"both":[209],"minimal":[212],"contextualization":[213],"strategies.":[214]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-01-08T00:00:00"}
