{"id":"https://openalex.org/W4410187692","doi":"https://doi.org/10.1007/s40747-025-01900-1","title":"Parameter-efficient weakly supervised referring video object segmentation via chain-of-thought reasoning","display_name":"Parameter-efficient weakly supervised referring video object segmentation via chain-of-thought reasoning","publication_year":2025,"publication_date":"2025-05-08","ids":{"openalex":"https://openalex.org/W4410187692","doi":"https://doi.org/10.1007/s40747-025-01900-1"},"language":"en","primary_location":{"id":"doi:10.1007/s40747-025-01900-1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s40747-025-01900-1","pdf_url":"https://link.springer.com/content/pdf/10.1007/s40747-025-01900-1.pdf","source":{"id":"https://openalex.org/S3035462843","display_name":"Complex & Intelligent Systems","issn_l":"2198-6053","issn":["2198-6053","2199-4536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Complex &amp; Intelligent Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://link.springer.com/content/pdf/10.1007/s40747-025-01900-1.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5011643677","display_name":"Xing Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xing Wang","raw_affiliation_strings":["School of Mechano Electronic Engineering, Xidian University, Xi\u2019an, Shaanxi, 710071, China"],"affiliations":[{"raw_affiliation_string":"School of Mechano Electronic Engineering, Xidian University, Xi\u2019an, Shaanxi, 710071, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016155663","display_name":"Zhe Xu","orcid":"https://orcid.org/0000-0001-6898-3443"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhe Xu","raw_affiliation_strings":["School of Electronic Engineering, Xidian University, Xi\u2019an, Shaanxi, 710071, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Engineering, Xidian University, Xi\u2019an, Shaanxi, 710071, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011899531","display_name":"Yuanshi Zheng","orcid":"https://orcid.org/0000-0002-1143-2509"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuanshi Zheng","raw_affiliation_strings":["School of Mechano Electronic Engineering, Xidian University, Xi\u2019an, Shaanxi, 710071, China"],"affiliations":[{"raw_affiliation_string":"School of Mechano Electronic Engineering, Xidian University, Xi\u2019an, Shaanxi, 710071, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5091324372","display_name":"Handing Wang","orcid":"https://orcid.org/0000-0002-4805-3780"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Handing Wang","raw_affiliation_strings":["School of Artificial Intelligence, Xidian University, Xi\u2019an, Shaanxi, 710071, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Xidian University, Xi\u2019an, Shaanxi, 710071, China","institution_ids":["https://openalex.org/I149594827"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5011643677"],"corresponding_institution_ids":["https://openalex.org/I149594827"],"apc_list":{"value":1320,"currency":"GBP","value_usd":1619},"apc_paid":{"value":1320,"currency":"GBP","value_usd":1619},"fwci":2.66,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.89593484,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":"11","issue":"6","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9914000034332275,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computational-intelligence","display_name":"Computational intelligence","score":0.6748838424682617},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.6723300218582153},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6357177495956421},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6123035550117493},{"id":"https://openalex.org/keywords/chain","display_name":"Chain (unit)","score":0.5524612069129944},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.541883111000061},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.46235689520835876},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.41118359565734863},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3742891550064087},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.06839486956596375}],"concepts":[{"id":"https://openalex.org/C139502532","wikidata":"https://www.wikidata.org/wiki/Q1122090","display_name":"Computational intelligence","level":2,"score":0.6748838424682617},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.6723300218582153},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6357177495956421},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6123035550117493},{"id":"https://openalex.org/C199185054","wikidata":"https://www.wikidata.org/wiki/Q552299","display_name":"Chain (unit)","level":2,"score":0.5524612069129944},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.541883111000061},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.46235689520835876},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.41118359565734863},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3742891550064087},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.06839486956596375},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1007/s40747-025-01900-1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s40747-025-01900-1","pdf_url":"https://link.springer.com/content/pdf/10.1007/s40747-025-01900-1.pdf","source":{"id":"https://openalex.org/S3035462843","display_name":"Complex & Intelligent Systems","issn_l":"2198-6053","issn":["2198-6053","2199-4536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Complex &amp; Intelligent Systems","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:4dc72fd8d8b24b0892cc7ea8be6a897b","is_oa":true,"landing_page_url":"https://doaj.org/article/4dc72fd8d8b24b0892cc7ea8be6a897b","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Complex & Intelligent Systems, Vol 11, Iss 6, Pp 1-12 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1007/s40747-025-01900-1","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s40747-025-01900-1","pdf_url":"https://link.springer.com/content/pdf/10.1007/s40747-025-01900-1.pdf","source":{"id":"https://openalex.org/S3035462843","display_name":"Complex & Intelligent Systems","issn_l":"2198-6053","issn":["2198-6053","2199-4536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Complex &amp; Intelligent Systems","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.4399999976158142,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4410187692.pdf","grobid_xml":"https://content.openalex.org/works/W4410187692.grobid-xml"},"referenced_works_count":66,"referenced_works":["https://openalex.org/W611457968","https://openalex.org/W2034014085","https://openalex.org/W2143331230","https://openalex.org/W2302548814","https://openalex.org/W2552414813","https://openalex.org/W2610147486","https://openalex.org/W2804867909","https://openalex.org/W2866912866","https://openalex.org/W2889658408","https://openalex.org/W2921536280","https://openalex.org/W2962758679","https://openalex.org/W2962945654","https://openalex.org/W2963253279","https://openalex.org/W2963354481","https://openalex.org/W2963524571","https://openalex.org/W2970476646","https://openalex.org/W2982651953","https://openalex.org/W2983693499","https://openalex.org/W2990205821","https://openalex.org/W3034804856","https://openalex.org/W3096609285","https://openalex.org/W3138516171","https://openalex.org/W3153427360","https://openalex.org/W3166738350","https://openalex.org/W3166986030","https://openalex.org/W3173777717","https://openalex.org/W3173788106","https://openalex.org/W3177892185","https://openalex.org/W3198377975","https://openalex.org/W3215899623","https://openalex.org/W4205991051","https://openalex.org/W4221143046","https://openalex.org/W4225495512","https://openalex.org/W4226024706","https://openalex.org/W4285729260","https://openalex.org/W4289639375","https://openalex.org/W4295046616","https://openalex.org/W4312310776","https://openalex.org/W4312438304","https://openalex.org/W4312560592","https://openalex.org/W4312651322","https://openalex.org/W4312690830","https://openalex.org/W4312815172","https://openalex.org/W4312884055","https://openalex.org/W4380763492","https://openalex.org/W4387398391","https://openalex.org/W4390577884","https://openalex.org/W4390872868","https://openalex.org/W4390874496","https://openalex.org/W4392516357","https://openalex.org/W4397024153","https://openalex.org/W4398200794","https://openalex.org/W4401328210","https://openalex.org/W4402684026","https://openalex.org/W4402727770","https://openalex.org/W4402754173","https://openalex.org/W4404601423","https://openalex.org/W4404769790","https://openalex.org/W6600005967","https://openalex.org/W6600299915","https://openalex.org/W6600336842","https://openalex.org/W6600445788","https://openalex.org/W6600577311","https://openalex.org/W6605686645","https://openalex.org/W6630827713","https://openalex.org/W6702248584"],"related_works":["https://openalex.org/W2736674626","https://openalex.org/W2973875853","https://openalex.org/W4379231730","https://openalex.org/W4389858081","https://openalex.org/W2737719445","https://openalex.org/W2898210368","https://openalex.org/W4239098401","https://openalex.org/W2501551404","https://openalex.org/W4298131179","https://openalex.org/W2113201962"],"abstract_inverted_index":{"Referring":[0],"video":[1,118,138],"object":[2,9,119],"segmentation":[3,45,84,109],"(RVOS)":[4],"aims":[5],"to":[6,11,33,38,50,71,79,115,147],"segment":[7,116],"the":[8,40,53,100,112,117,127,137,149,153,161],"corresponding":[10],"a":[12,16,44,62,90,106,122],"language":[13,123,141],"expression":[14],"in":[15],"video.":[17],"Most":[18],"existing":[19],"RVOS":[20,87],"methods":[21,173],"are":[22,29],"trained":[23,94],"using":[24],"accurate":[25],"per-pixel":[26],"annotations,":[27],"which":[28],"expensive":[30],"and":[31,139,179],"time-consuming":[32],"obtain.":[34],"Moreover,":[35],"they":[36],"need":[37],"update":[39,126],"entire":[41],"parameter":[42],"of":[43,74,93,134,165],"model,":[46],"making":[47],"it":[48],"inefficient":[49],"train":[51],"as":[52],"model":[54,85,110],"scale":[55],"increases.":[56],"In":[57],"this":[58],"paper,":[59],"we":[60,77,143],"propose":[61,78,144],"novel":[63],"parameter-efficient":[64],"framework":[65],"under":[66,130],"weak":[67,131],"supervision,":[68,132],"dubbed":[69],"ReferringAdapter,":[70],"ameliorate":[72],"both":[73],"issues.":[75],"Specifically,":[76],"adapt":[80],"an":[81,97],"off-the-shelf":[82],"image":[83,108],"for":[86],"by":[88,121,174],"plugging":[89],"small":[91],"set":[92],"parameters,":[95],"i.e.,":[96],"adapter,":[98],"into":[99],"intermediate":[101,150],"layer.":[102],"This":[103],"efficiently":[104],"endows":[105],"uni-modal":[107],"with":[111,163,183],"cross-modal":[113],"ability":[114],"referred":[120],"expression.":[124],"To":[125],"adapter":[128,162],"parameters":[129,167],"instead":[133],"directly":[135],"fuse":[136],"sentence-level":[140],"features,":[142],"chain-of-thought":[145],"reasoning":[146],"consider":[148],"steps":[151],"along":[152],"thought":[154],"process.":[155],"Extensive":[156],"experiments":[157],"demonstrate":[158],"that":[159],"training":[160],"1.1%":[164],"total":[166],"can":[168],"outperform":[169],"previous":[170],"weakly":[171],"supervised":[172,185],"11.6":[175],"$$-$$":[176],"15.3":[177],"mAP":[178],"achieve":[180],"comparable":[181],"performance":[182],"fully":[184],"ones.":[186]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
