{"id":"https://openalex.org/W7162031917","doi":"https://doi.org/10.48550/arxiv.2605.20385","title":"ConceptSeg-R1: Segment Any Concept via Meta-Reinforcement Learning","display_name":"ConceptSeg-R1: Segment Any Concept via Meta-Reinforcement Learning","publication_year":2026,"publication_date":"2026-05-19","ids":{"openalex":"https://openalex.org/W7162031917","doi":"https://doi.org/10.48550/arxiv.2605.20385"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.20385","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.20385","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.20385","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136658528","display_name":"Yuan Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Yuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040300820","display_name":"Youwei Pang","orcid":"https://orcid.org/0000-0002-3950-0956"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pang, Youwei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104178086","display_name":"Jiaming Zuo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zuo, Jiaming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136667435","display_name":"Wei Ji","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ji, Wei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136678738","display_name":"Kailai Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Kailai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136704133","display_name":"Bin Fan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fan, Bin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136625958","display_name":"Yunkang Cao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Yunkang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136671001","display_name":"Lihe Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Lihe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136684252","display_name":"Xiaofeng Liu","orcid":"https://orcid.org/0009-0007-6147-7119"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Xiaofeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136701365","display_name":"Huchuan Lu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Huchuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136695700","display_name":"Weisi Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Weisi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136673123","display_name":"Dacheng Tao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tao, Dacheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136643070","display_name":"Xiaoqi Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Xiaoqi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":13,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.36390000581741333,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.36390000581741333,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.16140000522136688,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.14319999516010284,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.8131999969482422},{"id":"https://openalex.org/keywords/market-segmentation","display_name":"Market segmentation","score":0.6553000211715698},{"id":"https://openalex.org/keywords/hierarchy","display_name":"Hierarchy","score":0.5332000255584717},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.512499988079071},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.4618000090122223},{"id":"https://openalex.org/keywords/concept-learning","display_name":"Concept learning","score":0.387800008058548},{"id":"https://openalex.org/keywords/logical-reasoning","display_name":"Logical reasoning","score":0.37540000677108765},{"id":"https://openalex.org/keywords/proxy","display_name":"Proxy (statistics)","score":0.37220001220703125}],"concepts":[{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.8131999969482422},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6639999747276306},{"id":"https://openalex.org/C125308379","wikidata":"https://www.wikidata.org/wiki/Q363057","display_name":"Market segmentation","level":2,"score":0.6553000211715698},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5625},{"id":"https://openalex.org/C31170391","wikidata":"https://www.wikidata.org/wiki/Q188619","display_name":"Hierarchy","level":2,"score":0.5332000255584717},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.512499988079071},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.4618000090122223},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4074999988079071},{"id":"https://openalex.org/C48164120","wikidata":"https://www.wikidata.org/wiki/Q4491893","display_name":"Concept learning","level":2,"score":0.387800008058548},{"id":"https://openalex.org/C43971567","wikidata":"https://www.wikidata.org/wiki/Q3142865","display_name":"Logical reasoning","level":2,"score":0.37540000677108765},{"id":"https://openalex.org/C2780148112","wikidata":"https://www.wikidata.org/wiki/Q1432581","display_name":"Proxy (statistics)","level":2,"score":0.37220001220703125},{"id":"https://openalex.org/C58642233","wikidata":"https://www.wikidata.org/wiki/Q8269924","display_name":"Taxonomy (biology)","level":2,"score":0.3601999878883362},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.3537999987602234},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.35010001063346863},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.335999995470047},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.31700000166893005},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2978000044822693},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.2842999994754791},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.2802000045776367},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.2605000138282776},{"id":"https://openalex.org/C28006648","wikidata":"https://www.wikidata.org/wiki/Q6934509","display_name":"Multi-task learning","level":3,"score":0.2522999942302704}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.20385","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.20385","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.20385","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.20385","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recent":[0],"progress":[1],"in":[2],"promptable":[3,195],"segmentation":[4,41,81,145,167,196,217],"has":[5],"shifted":[6],"visual":[7,104],"perception":[8],"from":[9,103,218],"object-level":[10,219],"localization":[11],"toward":[12,202,221],"concept-level":[13,222],"understanding.":[14,223],"However,":[15],"the":[16,87,141,185,191],"notion":[17],"of":[18,47,65,89,144,194],"a":[19,43,58,75,94,124,212],"concept":[20,40,80,84,121,126,154,166,187],"remains":[21],"under-specified,":[22],"making":[23],"it":[24],"unclear":[25],"whether":[26],"current":[27],"methods":[28],"truly":[29],"generalize":[30],"beyond":[31],"category":[32],"recognition.":[33],"In":[34],"this":[35,70],"work,":[36],"we":[37,72,156,206],"formalize":[38],"generalized":[39,153],"through":[42,109],"three-level":[44],"taxonomy":[45],"consisting":[46],"context-independent":[48],"(CI),":[49],"context-dependent":[50],"(CD),":[51],"and":[52,106,164,173,178],"context-reasoning":[53],"(CR)":[54],"concepts,":[55],"which":[56],"reveals":[57],"clear":[59],"capability":[60,193],"gap":[61],"across":[62,160,184],"increasing":[63],"levels":[64],"cognitive":[66],"complexity.":[67],"To":[68,150],"address":[69],"challenge,":[71],"propose":[73],"ConceptSeg-R1,":[74],"unified":[76],"framework":[77],"that":[78,98],"reformulates":[79],"as":[82,211],"rule-induced":[83],"grounding.":[85],"At":[86],"core":[88],"our":[90],"method":[91],"is":[92],"Meta-GRPO,":[93],"meta-reinforcement":[95],"learning":[96],"mechanism":[97],"learns":[99],"transferable":[100],"task":[101],"rules":[102],"demonstrations":[105],"verifies":[107],"them":[108],"proxy":[110],"reasoning.":[111],"The":[112],"inferred":[113],"reasoning":[114],"states":[115],"are":[116],"then":[117],"translated":[118],"into":[119],"segmentation-ready":[120],"prompts":[122],"via":[123],"lightweight":[125],"translation":[127],"module,":[128],"enabling":[129],"deductive":[130],"application":[131],"to":[132],"target":[133],"images.":[134],"A":[135],"shortcut":[136],"routing":[137],"strategy":[138],"further":[139],"preserves":[140],"native":[142,192],"efficiency":[143],"models":[146],"on":[147],"simple":[148],"cases.":[149],"systematically":[151],"evaluate":[152],"segmentation,":[155],"conduct":[157],"extensive":[158],"experiments":[159],"diverse":[161],"CI,":[162],"CD,":[163],"CR":[165],"benchmarks":[168],"spanning":[169],"natural,":[170],"industrial,":[171],"medical":[172],"reasoning-intensive":[174],"domains.":[175],"Without":[176],"bells":[177],"whistles,":[179],"ConceptSeg-R1":[180,208],"achieves":[181],"strong":[182],"performance":[183],"full":[186],"hierarchy":[188],"while":[189],"maintaining":[190],"backbones.":[197],"As":[198],"an":[199],"initial":[200],"step":[201],"segmenting":[203],"any":[204],"concept,":[205],"hope":[207],"can":[209],"serve":[210],"practical":[213],"baseline":[214],"for":[215],"advancing":[216],"prediction":[220]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-22T00:00:00"}
