{"id":"https://openalex.org/W7156814507","doi":"https://doi.org/10.48550/arxiv.2604.22990","title":"Hard to See, Hard to Label: Generative and Symbolic Acquisition for Subtle Visual Phenomena","display_name":"Hard to See, Hard to Label: Generative and Symbolic Acquisition for Subtle Visual Phenomena","publication_year":2026,"publication_date":"2026-04-24","ids":{"openalex":"https://openalex.org/W7156814507","doi":"https://doi.org/10.48550/arxiv.2604.22990"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.22990","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.22990","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.22990","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134781713","display_name":"Renjith Prasad","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Prasad, Renjith","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134752949","display_name":"Rishabh Sharma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sharma, Rishabh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079718238","display_name":"Andrew Shao","orcid":"https://orcid.org/0000-0003-3658-512X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shao, Andrew E.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056133417","display_name":"Annmary Justine Koomthanam","orcid":"https://orcid.org/0009-0002-8282-6190"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Koomthanam, Annmary Justine","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134795972","display_name":"Shreyas Kulkarni","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kulkarni, Shreyas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5105513963","display_name":"Suparna Bhattacharya","orcid":"https://orcid.org/0000-0001-9541-4027"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bhattacharya, Suparna","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071889037","display_name":"Martin Folt\u00edn","orcid":"https://orcid.org/0000-0002-3386-0272"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Foltin, Martin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110087061","display_name":"Amit Sheth","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sheth, Amit","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134767244","display_name":"David Orozco","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Orozco, David","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134758232","display_name":"Brian Sammuli","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Quinn, Matthew","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Sammuli, Brian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sammuli, Brian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5134781713"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.4860000014305115,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.4860000014305115,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.14309999346733093,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.08049999922513962,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/heuristics","display_name":"Heuristics","score":0.6542999744415283},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.5940999984741211},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.48010000586509705},{"id":"https://openalex.org/keywords/pascal","display_name":"Pascal (unit)","score":0.44850000739097595},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.44440001249313354},{"id":"https://openalex.org/keywords/scene-graph","display_name":"Scene graph","score":0.421999990940094},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.39959999918937683},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.39329999685287476},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.3799000084400177}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7233999967575073},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6837000250816345},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.6542999744415283},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.5940999984741211},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.48010000586509705},{"id":"https://openalex.org/C75608658","wikidata":"https://www.wikidata.org/wiki/Q44395","display_name":"Pascal (unit)","level":2,"score":0.44850000739097595},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.44440001249313354},{"id":"https://openalex.org/C179372163","wikidata":"https://www.wikidata.org/wiki/Q1406181","display_name":"Scene graph","level":3,"score":0.421999990940094},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.39959999918937683},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.39559999108314514},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.39329999685287476},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.38119998574256897},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.3799000084400177},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.3718999922275543},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.3513000011444092},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.34929999709129333},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.34709998965263367},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.30880001187324524},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.30559998750686646},{"id":"https://openalex.org/C70518039","wikidata":"https://www.wikidata.org/wiki/Q16000077","display_name":"Dimensionality reduction","level":2,"score":0.28450000286102295},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.2818000018596649},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.27799999713897705},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.27649998664855957},{"id":"https://openalex.org/C197914299","wikidata":"https://www.wikidata.org/wiki/Q18650","display_name":"Semantic memory","level":3,"score":0.2759000062942505},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.2676999866962433},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.26190000772476196},{"id":"https://openalex.org/C52146309","wikidata":"https://www.wikidata.org/wiki/Q7431116","display_name":"Schema (genetic algorithms)","level":2,"score":0.2612999975681305},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.2506999969482422}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.22990","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.22990","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.22990","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.22990","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.7994728684425354,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Subtle":[0],"visual":[1,164],"anomalies":[2,66],"such":[3],"as":[4],"hairline":[5],"cracks,":[6],"sub-millimeter":[7],"voids,":[8],"and":[9,24,71,108,113,150,174,192,202,208],"low-contrast":[10],"inclusions":[11],"are":[12,178],"structurally":[13],"atypical":[14,118],"yet":[15,48],"visually":[16,117],"ambiguous,":[17],"making":[18],"them":[19],"both":[20,69],"difficult":[21,72],"to":[22,26,73],"annotate":[23],"easy":[25],"overlook":[27],"during":[28],"active":[29,85],"learning.":[30],"Standard":[31],"acquisition":[32,128,160],"heuristics":[33],"based":[34],"on":[35,185],"discriminative":[36],"uncertainty":[37],"or":[38,119],"feature":[39],"diversity":[40],"often":[41,179],"overselect":[42],"dominant":[43,135],"patterns":[44],"while":[45,157],"underexploring":[46],"sparse":[47],"important":[49],"regions":[50,156],"of":[51,153,172],"the":[52],"data":[53],"space.":[54],"This":[55],"failure":[56],"mode":[57],"is":[58],"especially":[59],"severe":[60],"in":[61,145,199],"industrial":[62],"defect":[63],"inspection,":[64],"where":[65],"may":[67],"be":[68],"low-prevalence":[70],"distinguish":[74],"from":[75,129],"surrounding":[76],"structure.":[77],"To":[78],"resolve":[79],"this,":[80],"we":[81],"propose":[82],"GSAL,":[83],"an":[84],"learning":[86],"framework":[87],"for":[88],"object":[89],"detection":[90],"that":[91,177],"combines":[92],"a":[93,98,146,186],"diffusion-based":[94],"difficulty":[95,165],"signal":[96],"with":[97,166],"hierarchical":[99],"semantic":[100,136,139,155,167],"coverage":[101,152],"prior.":[102],"The":[103,138],"diffusion":[104,123],"component":[105,140],"scores":[106],"images":[107],"proposals":[109],"using":[110],"reconstruction":[111],"discrepancy":[112],"denoising":[114],"variability,":[115],"prioritizing":[116],"ambiguous":[120],"examples.":[121],"However,":[122],"alone":[124],"does":[125],"not":[126],"prevent":[127],"repeatedly":[130],"favoring":[131],"hard":[132],"samples":[133,144],"within":[134],"modes.":[137],"therefore":[141],"organizes":[142],"candidate":[143],"three-level":[147],"concept":[148],"graph":[149],"promotes":[151],"underrepresented":[154],"providing":[158],"interpretable":[159],"rationales.":[161],"By":[162],"balancing":[163],"coverage,":[168],"GSAL":[169],"improves":[170],"retrieval":[171,204],"subtle":[173],"rare":[175],"targets":[176],"missed":[180],"by":[181],"uncertainty-only":[182],"selection.":[183],"Experiments":[184],"proprietary":[187],"thin-film":[188],"defect,":[189],"Pascal":[190],"VOC":[191],"MS":[193],"COCO":[194],"dataset":[195],"show":[196],"consistent":[197],"gains":[198],"label":[200],"efficiency":[201],"rare-class":[203],"over":[205],"uncertainty-,":[206],"diversity-,":[207],"hybrid-based":[209],"baselines":[210]},"counts_by_year":[],"updated_date":"2026-04-30T06:05:26.967640","created_date":"2026-04-29T00:00:00"}
