{"id":"https://openalex.org/W7118980923","doi":"https://doi.org/10.48550/arxiv.2601.03011","title":"ReCCur: A Recursive Corner-Case Curation Framework for Robust Vision-Language Understanding in Open and Edge Scenarios","display_name":"ReCCur: A Recursive Corner-Case Curation Framework for Robust Vision-Language Understanding in Open and Edge Scenarios","publication_year":2026,"publication_date":"2026-01-06","ids":{"openalex":"https://openalex.org/W7118980923","doi":"https://doi.org/10.48550/arxiv.2601.03011"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.03011","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.03011","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.03011","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5122245711","display_name":"Yihan Wei","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wei, Yihan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050656216","display_name":"Shenghai Yuan","orcid":"https://orcid.org/0009-0000-4850-2278"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yuan, Shenghai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122125025","display_name":"Tianchen Deng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Deng, Tianchen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111287920","display_name":"Boyang Lou","orcid":"https://orcid.org/0009-0000-9071-4063"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lou, Boyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5077221055","display_name":"Enwen Hu","orcid":"https://orcid.org/0000-0001-5019-3961"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Enwen","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5122245711"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.6216999888420105,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.6216999888420105,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.07829999923706055,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.04659999907016754,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5598000288009644},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.5202999711036682},{"id":"https://openalex.org/keywords/validator","display_name":"Validator","score":0.4973999857902527},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.4851999878883362},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.47690001130104065},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.4332999885082245},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.4072999954223633},{"id":"https://openalex.org/keywords/tuple","display_name":"Tuple","score":0.38670000433921814},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.38269999623298645},{"id":"https://openalex.org/keywords/semantic-web","display_name":"Semantic Web","score":0.37059998512268066}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7964000105857849},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5598000288009644},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.5202999711036682},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4999000132083893},{"id":"https://openalex.org/C35292069","wikidata":"https://www.wikidata.org/wiki/Q1575458","display_name":"Validator","level":2,"score":0.4973999857902527},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.4851999878883362},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.47690001130104065},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.47429999709129333},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4334000051021576},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.4332999885082245},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.4072999954223633},{"id":"https://openalex.org/C118930307","wikidata":"https://www.wikidata.org/wiki/Q600590","display_name":"Tuple","level":2,"score":0.38670000433921814},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.38269999623298645},{"id":"https://openalex.org/C2129575","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Semantic Web","level":2,"score":0.37059998512268066},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.35740000009536743},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.34209999442100525},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.3386000096797943},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.3192000091075897},{"id":"https://openalex.org/C520049643","wikidata":"https://www.wikidata.org/wiki/Q189760","display_name":"Voting","level":3,"score":0.3151000142097473},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2964000105857849},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2957000136375427},{"id":"https://openalex.org/C160145156","wikidata":"https://www.wikidata.org/wiki/Q778586","display_name":"Executable","level":2,"score":0.2953999936580658},{"id":"https://openalex.org/C207685749","wikidata":"https://www.wikidata.org/wiki/Q2088941","display_name":"Domain knowledge","level":2,"score":0.29429998993873596},{"id":"https://openalex.org/C2776145971","wikidata":"https://www.wikidata.org/wiki/Q30673951","display_name":"Labeled data","level":2,"score":0.2890999913215637},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.289000004529953},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.2858000099658966},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.2809000015258789},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2777000069618225},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.27070000767707825},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2689000070095062},{"id":"https://openalex.org/C147497476","wikidata":"https://www.wikidata.org/wiki/Q54872","display_name":"RDF","level":3,"score":0.25949999690055847},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.2540999948978424},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.2524000108242035},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.25040000677108765}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.03011","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.03011","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.03011","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.03011","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Corner":[0],"cases":[1],"are":[2,13,21,24],"rare":[3],"or":[4],"extreme":[5],"scenarios":[6,146],"that":[7,41],"drive":[8],"real-world":[9],"failures,":[10],"but":[11],"they":[12],"difficult":[14],"to":[15,85,110,135],"curate":[16],"at":[17],"scale:":[18],"web":[19,44],"data":[20,57],"noisy,":[22],"labels":[23,49,138],"brittle,":[25],"and":[26,59,73,106,124,131,139,158,160,172,178],"edge":[27],"deployments":[28],"preclude":[29],"large":[30],"retraining.":[31],"We":[32],"present":[33],"ReCCur":[34,150],"(Recursive":[35],"Corner-Case":[36],"Curation),":[37],"a":[38,51,62,66,111,120,128,166],"low-compute":[39],"framework":[40],"converts":[42],"noisy":[43],"imagery":[45],"into":[46],"auditable":[47],"fine-grained":[48],"via":[50],"multi-agent":[52],"recursive":[53],"pipeline.":[54],"First,":[55],"large-scale":[56],"acquisition":[58],"filtering":[60],"expands":[61],"domain":[63],"vocabulary":[64],"with":[65,80,103,127],"vision-language":[67],"model":[68],"(VLM),":[69],"crawls":[70],"the":[71,141],"web,":[72],"enforces":[74],"tri-modal":[75],"(image,":[76],"description,":[77],"keyword)":[78],"consistency":[79],"light":[81],"human":[82,163],"spot":[83],"checks":[84],"yield":[86],"refined":[87],"candidates.":[88],"Next,":[89],"mixture-of-experts":[90],"knowledge":[91],"distillation":[92],"uses":[93],"complementary":[94],"encoders":[95],"(e.g.,":[96,147],"CLIP,":[97],"DINOv2,":[98],"BEiT)":[99],"for":[100,169],"kNN":[101],"voting":[102],"dual-confidence":[104],"activation":[105],"uncertainty":[107],"sampling,":[108],"converging":[109],"high-precision":[112],"set.":[113],"Finally,":[114],"region-evidence":[115],"VLM":[116],"adversarial":[117],"labeling":[118],"pairs":[119],"proposer":[121],"(multi-granularity":[122],"regions":[123],"semantic":[125],"cues)":[126],"validator":[129],"(global":[130],"local":[132],"chained":[133],"consistency)":[134],"produce":[136],"explainable":[137],"close":[140],"loop.":[142],"On":[143],"realistic":[144],"corner-case":[145],"flooded-car":[148],"inspection),":[149],"runs":[151],"on":[152],"consumer-grade":[153],"GPUs,":[154],"steadily":[155],"improves":[156],"purity":[157],"separability,":[159],"requires":[161],"minimal":[162],"supervision,":[164],"providing":[165],"practical":[167],"substrate":[168],"downstream":[170],"training":[171],"evaluation":[173],"under":[174],"resource":[175],"constraints.":[176],"Code":[177],"dataset":[179],"will":[180],"be":[181],"released.":[182]},"counts_by_year":[],"updated_date":"2026-01-08T20:10:11.968330","created_date":"2026-01-08T00:00:00"}
