{"id":"https://openalex.org/W7138218695","doi":"https://doi.org/10.48550/arxiv.2603.14382","title":"StAR: Segment Anything Reasoner","display_name":"StAR: Segment Anything Reasoner","publication_year":2026,"publication_date":"2026-03-15","ids":{"openalex":"https://openalex.org/W7138218695","doi":"https://doi.org/10.48550/arxiv.2603.14382"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.14382","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.14382","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.14382","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129653133","display_name":"Seokju Yun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yun, Seokju","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5099042218","display_name":"Dongheon Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Dongheon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129683926","display_name":"Noori Bae","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bae, Noori","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013059423","display_name":"Jaesung Jun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jun, Jaesung","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129722596","display_name":"Chanseul Cho","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cho, Chanseul","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5099042219","display_name":"Youngmin Ro","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ro, Youngmin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9629999995231628,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9629999995231628,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.009200000204145908,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.0052999998442828655,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/semantic-reasoner","display_name":"Semantic reasoner","score":0.9455000162124634},{"id":"https://openalex.org/keywords/knowledge-base","display_name":"Knowledge base","score":0.4699999988079071},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.3971000015735626},{"id":"https://openalex.org/keywords/scope","display_name":"Scope (computer science)","score":0.3804999887943268},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.3779999911785126},{"id":"https://openalex.org/keywords/reasoning-system","display_name":"Reasoning system","score":0.3718000054359436},{"id":"https://openalex.org/keywords/qualitative-reasoning","display_name":"Qualitative reasoning","score":0.36559998989105225},{"id":"https://openalex.org/keywords/abductive-reasoning","display_name":"Abductive reasoning","score":0.36390000581741333},{"id":"https://openalex.org/keywords/spatial-intelligence","display_name":"Spatial intelligence","score":0.36230000853538513}],"concepts":[{"id":"https://openalex.org/C9616225","wikidata":"https://www.wikidata.org/wiki/Q3929429","display_name":"Semantic reasoner","level":2,"score":0.9455000162124634},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.725600004196167},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6344000101089478},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.4699999988079071},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.3971000015735626},{"id":"https://openalex.org/C2778012447","wikidata":"https://www.wikidata.org/wiki/Q1034415","display_name":"Scope (computer science)","level":2,"score":0.3804999887943268},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.3779999911785126},{"id":"https://openalex.org/C89288958","wikidata":"https://www.wikidata.org/wiki/Q7301504","display_name":"Reasoning system","level":2,"score":0.3718000054359436},{"id":"https://openalex.org/C83725634","wikidata":"https://www.wikidata.org/wiki/Q7268699","display_name":"Qualitative reasoning","level":2,"score":0.36559998989105225},{"id":"https://openalex.org/C166088908","wikidata":"https://www.wikidata.org/wiki/Q308495","display_name":"Abductive reasoning","level":2,"score":0.36390000581741333},{"id":"https://openalex.org/C155911833","wikidata":"https://www.wikidata.org/wiki/Q3817354","display_name":"Spatial intelligence","level":2,"score":0.36230000853538513},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.3621000051498413},{"id":"https://openalex.org/C42058472","wikidata":"https://www.wikidata.org/wiki/Q810214","display_name":"Base (topology)","level":2,"score":0.34220001101493835},{"id":"https://openalex.org/C37335422","wikidata":"https://www.wikidata.org/wiki/Q6888134","display_name":"Model-based reasoning","level":3,"score":0.3402999937534332},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.3310999870300293},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32749998569488525},{"id":"https://openalex.org/C193221554","wikidata":"https://www.wikidata.org/wiki/Q5153664","display_name":"Commonsense reasoning","level":2,"score":0.3228999972343445},{"id":"https://openalex.org/C161301231","wikidata":"https://www.wikidata.org/wiki/Q3478658","display_name":"Knowledge representation and reasoning","level":2,"score":0.32190001010894775},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.3107999861240387},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2815999984741211},{"id":"https://openalex.org/C159032336","wikidata":"https://www.wikidata.org/wiki/Q2488768","display_name":"Non-monotonic logic","level":2,"score":0.2766999900341034},{"id":"https://openalex.org/C86827895","wikidata":"https://www.wikidata.org/wiki/Q7098582","display_name":"Opportunistic reasoning","level":4,"score":0.26829999685287476},{"id":"https://openalex.org/C43971567","wikidata":"https://www.wikidata.org/wiki/Q3142865","display_name":"Logical reasoning","level":2,"score":0.26440000534057617},{"id":"https://openalex.org/C58328972","wikidata":"https://www.wikidata.org/wiki/Q184609","display_name":"Expert system","level":2,"score":0.25760000944137573}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.14382","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.14382","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.14382","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.14382","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"As":[0],"AI":[1],"systems":[2],"are":[3],"being":[4],"integrated":[5],"more":[6],"rapidly":[7],"into":[8],"diverse":[9],"and":[10,24,78,113,131,157],"complex":[11],"real-world":[12],"environments,":[13],"the":[14,44,49,66,90,100,104,111,124,151,195],"ability":[15],"to":[16,27,41,99,149,194],"perform":[17],"holistic":[18],"reasoning":[19,37,46,116,129,155,192],"over":[20,84,178],"an":[21,25],"implicit":[22],"query":[23],"image":[26],"localize":[28],"a":[29,61,145,159],"target":[30],"is":[31],"becoming":[32],"increasingly":[33],"important.":[34],"However,":[35],"recent":[36,85],"segmentation":[38,101],"methods":[39],"fail":[40],"sufficiently":[42],"elicit":[43],"visual":[45],"capabilities":[47],"of":[48,115,166],"base":[50,152,180],"mode.":[51],"In":[52,87],"this":[53,139],"work,":[54],"we":[55,93,121,141],"present":[56],"Segment":[57],"Anything":[58],"Reasoner":[59],"(StAR),":[60],"comprehensive":[62],"framework":[63],"that":[64,134,186],"refines":[65],"design":[67],"space":[68],"from":[69],"multiple":[70],"perspectives-including":[71],"parameter-tuning":[72],"scheme,":[73],"reward":[74],"functions,":[75],"learning":[76],"strategies":[77],"answer":[79],"format-and":[80],"achieves":[81,175],"substantial":[82],"improvements":[83],"baselines.":[86],"addition,":[88],"for":[89,162],"first":[91],"time,":[92],"successfully":[94],"introduce":[95],"parallel":[96],"test-time":[97],"scaling":[98],"task,":[102],"pushing":[103],"performance":[105],"boundary":[106],"even":[107],"further.":[108],"To":[109],"extend":[110],"scope":[112],"depth":[114],"covered":[117],"by":[118],"existing":[119],"benchmark,":[120],"also":[122],"construct":[123],"ReasonSeg-X,":[125],"which":[126],"compactly":[127],"defines":[128],"types":[130],"includes":[132],"samples":[133],"require":[135],"deeper":[136],"reasoning.":[137],"Leveraging":[138],"dataset,":[140],"train":[142],"StAR":[143,174],"with":[144],"rollout-expanded":[146],"selective-tuning":[147],"approach":[148],"activate":[150],"model's":[153],"latent":[154],"capabilities,":[156],"establish":[158],"rigorous":[160],"benchmark":[161],"systematic,":[163],"fine-grained":[164],"evaluation":[165],"advanced":[167],"methods.":[168],"With":[169],"only":[170],"5k":[171],"training":[172],"samples,":[173],"significant":[176],"gains":[177],"its":[179],"counterparts":[181],"across":[182],"extensive":[183],"benchmarks,":[184],"demonstrating":[185],"our":[187],"method":[188],"effectively":[189],"brings":[190],"dormant":[191],"competence":[193],"surface.":[196]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-18T00:00:00"}
