{"id":"https://openalex.org/W7138970347","doi":"https://doi.org/10.48550/arxiv.2603.16932","title":"Look Where It Matters: High-Resolution Crops Retrieval for Efficient VLMs","display_name":"Look Where It Matters: High-Resolution Crops Retrieval for Efficient VLMs","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138970347","doi":"https://doi.org/10.48550/arxiv.2603.16932"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.16932","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16932","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.16932","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129869140","display_name":"Nimrod Shabtay","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Shabtay, Nimrod","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046832314","display_name":"Moshe Kimhi","orcid":"https://orcid.org/0009-0000-7645-7339"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kimhi, Moshe","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058222100","display_name":"Artem Spector","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Spector, Artem","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130133256","display_name":"Sivan Haray","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Haray, Sivan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024009299","display_name":"Ehud Rivlin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rivlin, Ehud","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130026464","display_name":"Chaim Baskin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Baskin, Chaim","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072571599","display_name":"Raja Giryes","orcid":"https://orcid.org/0000-0002-2830-0297"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Giryes, Raja","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129809186","display_name":"Eli Schwartz","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Schwartz, Eli","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5129869140"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9366999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9366999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.007799999788403511,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.007699999958276749,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.7260000109672546},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.6983000040054321},{"id":"https://openalex.org/keywords/oracle","display_name":"Oracle","score":0.6208000183105469},{"id":"https://openalex.org/keywords/forcing","display_name":"Forcing (mathematics)","score":0.6169999837875366},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5958999991416931},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5860999822616577},{"id":"https://openalex.org/keywords/cropping","display_name":"Cropping","score":0.4512999951839447},{"id":"https://openalex.org/keywords/data-set","display_name":"Data set","score":0.3828999996185303}],"concepts":[{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.7260000109672546},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.6983000040054321},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6614999771118164},{"id":"https://openalex.org/C55166926","wikidata":"https://www.wikidata.org/wiki/Q2892946","display_name":"Oracle","level":2,"score":0.6208000183105469},{"id":"https://openalex.org/C197115733","wikidata":"https://www.wikidata.org/wiki/Q1003136","display_name":"Forcing (mathematics)","level":2,"score":0.6169999837875366},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5958999991416931},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5860999822616577},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4681999981403351},{"id":"https://openalex.org/C13558536","wikidata":"https://www.wikidata.org/wiki/Q785116","display_name":"Cropping","level":3,"score":0.4512999951839447},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4090000092983246},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.38749998807907104},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.3828999996185303},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.36070001125335693},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.3240000009536743},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.32350000739097595},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.288100004196167},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.28760001063346863},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.27649998664855957},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.2759999930858612},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.2660999894142151},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.2554999887943268}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.16932","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16932","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.16932","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16932","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Vision-language":[0],"models":[1],"(VLMs)":[2],"typically":[3],"process":[4],"images":[5],"at":[6],"a":[7,11,46,57,71,79,108,129],"native":[8],"high-resolution,":[9],"forcing":[10],"trade-off":[12,53],"between":[13],"accuracy":[14],"and":[15,61,92],"computational":[16,26],"efficiency:":[17],"high-resolution":[18,67,84],"inputs":[19,30],"capture":[20],"fine":[21],"details":[22],"but":[23],"incur":[24],"significant":[25],"costs,":[27],"while":[28],"low-resolution":[29,58],"advocate":[31],"for":[32,70,100],"efficiency,":[33],"they":[34],"potentially":[35],"miss":[36],"critical":[37],"visual":[38],"information,":[39],"like":[40],"small":[41],"text.":[42],"We":[43,74,117],"present":[44],"AwaRes,":[45],"spatial-on-demand":[47],"framework":[48,120],"that":[49,132],"resolves":[50],"this":[51],"accuracy-efficiency":[52],"by":[54,125],"operating":[55],"on":[56],"global":[59],"view":[60],"using":[62],"tool-calling":[63],"to":[64,86,107,112],"retrieve":[65],"only":[66],"segments":[68],"needed":[69],"given":[72],"query.":[73],"construct":[75],"supervised":[76],"data":[77],"automatically:":[78],"judge":[80],"compares":[81],"low-":[82],"vs.\\":[83],"answers":[85],"label":[87],"whether":[88],"cropping":[89],"is":[90],"needed,":[91],"an":[93],"oracle":[94],"grounding":[95],"model":[96],"localizes":[97],"the":[98,101],"evidence":[99],"correct":[102],"answer,":[103],"which":[104],"we":[105],"map":[106],"discrete":[109],"crop":[110],"set":[111],"form":[113],"multi-turn":[114,126],"tool-use":[115],"trajectories.":[116],"train":[118],"our":[119],"with":[121,128,137],"cold-start":[122],"SFT":[123],"followed":[124],"GRPO":[127],"composite":[130],"reward":[131],"combines":[133],"semantic":[134],"answer":[135],"correctness":[136],"explicit":[138],"crop-cost":[139],"penalties.":[140],"Project":[141],"page:":[142],"https://nimrodshabtay.github.io/AwaRes":[143]},"counts_by_year":[],"updated_date":"2026-03-20T20:54:20.808490","created_date":"2026-03-20T00:00:00"}
