{"id":"https://openalex.org/W3178075329","doi":"https://doi.org/10.1109/tpami.2021.3079993","title":"Cross-Modal Progressive Comprehension for Referring Segmentation","display_name":"Cross-Modal Progressive Comprehension for Referring Segmentation","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3178075329","doi":"https://doi.org/10.1109/tpami.2021.3079993","mag":"3178075329","pmid":"https://pubmed.ncbi.nlm.nih.gov/33983880"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2021.3079993","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2021.3079993","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100330138","display_name":"Si Liu","orcid":"https://orcid.org/0000-0002-9180-2935"},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Si Liu","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University, Beijing, beijing, China, (e-mail: liusi@buaa.edu.cn)"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University, Beijing, beijing, China, (e-mail: liusi@buaa.edu.cn)","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056811650","display_name":"Tianrui Hui","orcid":"https://orcid.org/0000-0002-1172-1554"},"institutions":[{"id":"https://openalex.org/I4210156404","display_name":"Institute of Information Engineering","ror":"https://ror.org/04r53se39","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210156404"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tianrui Hui","raw_affiliation_strings":["Institute of Information Engineering, Chinese Academy of Sciences, 12381 Beijing, Beijing, China, (e-mail: huitianrui@iie.ac.cn)"],"affiliations":[{"raw_affiliation_string":"Institute of Information Engineering, Chinese Academy of Sciences, 12381 Beijing, Beijing, China, (e-mail: huitianrui@iie.ac.cn)","institution_ids":["https://openalex.org/I4210156404"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024226895","display_name":"Shaofei Huang","orcid":"https://orcid.org/0000-0001-8996-9907"},"institutions":[{"id":"https://openalex.org/I4210156404","display_name":"Institute of Information Engineering","ror":"https://ror.org/04r53se39","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210156404"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shaofei Huang","raw_affiliation_strings":["Institute of Information Engineering, Chinese Academy of Sciences, 12381 Beijing, Beijing, China, (e-mail: huangshaofei@iie.ac.cn)"],"affiliations":[{"raw_affiliation_string":"Institute of Information Engineering, Chinese Academy of Sciences, 12381 Beijing, Beijing, China, (e-mail: huangshaofei@iie.ac.cn)","institution_ids":["https://openalex.org/I4210156404"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087043856","display_name":"Yunchao Wei","orcid":"https://orcid.org/0000-0002-2812-8781"},"institutions":[{"id":"https://openalex.org/I114017466","display_name":"University of Technology Sydney","ror":"https://ror.org/03f0f6041","country_code":"AU","type":"education","lineage":["https://openalex.org/I114017466"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Yunchao Wei","raw_affiliation_strings":["Centre for Artificial Intelligence, University of Technology Sydney, 1994 Sydney, New South Wales, Australia, (e-mail: Yunchao.Wei@uts.edu.au)"],"affiliations":[{"raw_affiliation_string":"Centre for Artificial Intelligence, University of Technology Sydney, 1994 Sydney, New South Wales, Australia, (e-mail: Yunchao.Wei@uts.edu.au)","institution_ids":["https://openalex.org/I114017466"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100374360","display_name":"Bo Li","orcid":"https://orcid.org/0000-0001-6709-0942"},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo Li","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University, 12633 Beijing, Beijing, China, (e-mail: boli@buaa.edu.cn)"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University, 12633 Beijing, Beijing, China, (e-mail: boli@buaa.edu.cn)","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I82880672"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042965510","display_name":"Guanbin Li","orcid":"https://orcid.org/0000-0002-4805-0926"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guanbin Li","raw_affiliation_strings":["School of Data and Computer Science, Sun Yat-Sen University, 26469 Guangzhou, Guangdong, China, 510006 (e-mail: liguanbin@mail.sysu.edu.cn)"],"affiliations":[{"raw_affiliation_string":"School of Data and Computer Science, Sun Yat-Sen University, 26469 Guangzhou, Guangdong, China, 510006 (e-mail: liguanbin@mail.sysu.edu.cn)","institution_ids":["https://openalex.org/I157773358"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100330138"],"corresponding_institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I82880672"],"apc_list":null,"apc_paid":null,"fwci":8.936,"has_fulltext":false,"cited_by_count":125,"citation_normalized_percentile":{"value":0.98522303,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"44","issue":"9","first_page":"1","last_page":"1"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9886999726295471,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9879999756813049,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7360479831695557},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5544954538345337},{"id":"https://openalex.org/keywords/expression","display_name":"Expression (computer science)","score":0.5225067734718323},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5034295916557312},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.49734166264533997},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.47747159004211426},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.473099023103714},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.41086384654045105},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4062032401561737},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3498578369617462},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.11523625254631042}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7360479831695557},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5544954538345337},{"id":"https://openalex.org/C90559484","wikidata":"https://www.wikidata.org/wiki/Q778379","display_name":"Expression (computer science)","level":2,"score":0.5225067734718323},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5034295916557312},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.49734166264533997},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.47747159004211426},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.473099023103714},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.41086384654045105},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4062032401561737},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3498578369617462},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.11523625254631042},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D032882","descriptor_name":"Comprehension","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D032882","descriptor_name":"Comprehension","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D032882","descriptor_name":"Comprehension","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2021.3079993","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2021.3079993","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:33983880","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/33983880","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.47999998927116394,"id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G7834498664","display_name":null,"funder_award_id":"61876177","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":70,"referenced_works":["https://openalex.org/W1485009520","https://openalex.org/W1522301498","https://openalex.org/W1861492603","https://openalex.org/W1903029394","https://openalex.org/W1905722737","https://openalex.org/W1923697677","https://openalex.org/W2006147162","https://openalex.org/W2020755048","https://openalex.org/W2031489346","https://openalex.org/W2034014085","https://openalex.org/W2064675550","https://openalex.org/W2161236525","https://openalex.org/W2194775991","https://openalex.org/W2250539671","https://openalex.org/W2251512949","https://openalex.org/W2302548814","https://openalex.org/W2412782625","https://openalex.org/W2489434015","https://openalex.org/W2560023338","https://openalex.org/W2605127024","https://openalex.org/W2619947201","https://openalex.org/W2630837129","https://openalex.org/W2747053578","https://openalex.org/W2776638780","https://openalex.org/W2798556392","https://openalex.org/W2806331055","https://openalex.org/W2876852810","https://openalex.org/W2889986507","https://openalex.org/W2894964039","https://openalex.org/W2947128531","https://openalex.org/W2955058313","https://openalex.org/W2955813853","https://openalex.org/W2960655175","https://openalex.org/W2962744691","https://openalex.org/W2963091558","https://openalex.org/W2963109634","https://openalex.org/W2963145877","https://openalex.org/W2963150697","https://openalex.org/W2963319519","https://openalex.org/W2963354481","https://openalex.org/W2963524571","https://openalex.org/W2963717374","https://openalex.org/W2964015378","https://openalex.org/W2964345792","https://openalex.org/W2964935470","https://openalex.org/W2973233205","https://openalex.org/W2980088508","https://openalex.org/W2983693499","https://openalex.org/W2986755220","https://openalex.org/W2998631105","https://openalex.org/W3003423830","https://openalex.org/W3004019157","https://openalex.org/W3006154882","https://openalex.org/W3020827971","https://openalex.org/W3034325957","https://openalex.org/W3034772468","https://openalex.org/W3034777757","https://openalex.org/W3035268124","https://openalex.org/W3099166112","https://openalex.org/W3104844437","https://openalex.org/W6631190155","https://openalex.org/W6640295612","https://openalex.org/W6726873649","https://openalex.org/W6739696289","https://openalex.org/W6754309021","https://openalex.org/W6755002340","https://openalex.org/W6763197473","https://openalex.org/W6767362881","https://openalex.org/W6768730002","https://openalex.org/W6955071965"],"related_works":["https://openalex.org/W2517104666","https://openalex.org/W2005437358","https://openalex.org/W1669643531","https://openalex.org/W2008656436","https://openalex.org/W2134924024","https://openalex.org/W2023558673","https://openalex.org/W2110230079","https://openalex.org/W1982826852","https://openalex.org/W2613186388","https://openalex.org/W1967061043"],"abstract_inverted_index":{"Given":[0],"a":[1,46,58,85,100,105,199],"natural":[2],"language":[3],"expression":[4],"and":[5,38,42,74,96,104,113,126,238,263,276],"an":[6],"image/video,":[7],"the":[8,16,20,24,27,54,66,77,132,140,143,150,179,184,194,210,219,223,244],"goal":[9],"of":[10,19,26,225],"referring":[11,55,111,260,272,278],"segmentation":[12,115,261,274,280],"is":[13,285],"to":[14,52,91,109,129,148,177,193,208,215],"produce":[15],"pixel-level":[17],"masks":[18],"entities":[21,73,134],"described":[22],"by":[23,34,139,160,187],"subject":[25],"expression.":[28,141],"Previous":[29],"approaches":[30],"tackle":[31],"this":[32,81,229],"problem":[33,56],"implicit":[35],"feature":[36],"interaction":[37],"fusion":[39],"between":[40],"visual":[41,220],"linguistic":[43],"modalities":[44],"in":[45,57,65,218],"one-stage":[47],"manner.":[48],"However,":[49],"human":[50,94],"tends":[51],"solve":[53],"progressive":[59,87],"manner":[60],"based":[61,174,242],"on":[62,175,243,270],"informative":[63],"words":[64,128,145,173],"expression,":[67],"i.e.,":[68],"first":[69,123],"roughly":[70],"locating":[71],"candidate":[72],"then":[75],"distinguishing":[76],"target":[78,151],"one.":[79],"In":[80,191,228],"paper,":[82],"we":[83,196],"propose":[84],"cross-modal":[86],"comprehension":[88],"(CMPC)":[89],"scheme":[90],"effectively":[92],"mimic":[93],"behaviors":[95],"implement":[97],"it":[98],"as":[99,153,155],"CMPC-I":[101,121,176,248],"(Image)":[102],"module":[103,108,122,169,207],"CMPC-V":[106,168,250],"(Video)":[107],"improve":[110],"image":[112,118,256,273],"video":[114,165,258,279],"models.":[116],"For":[117,164],"data,":[119,166],"our":[120,167,255,264],"employs":[124],"entity":[125,152,181],"attribute":[127],"perceive":[130],"all":[131],"related":[133],"that":[135],"might":[136],"be":[137,239],"considered":[138],"Then,":[142],"relational":[144],"are":[146],"adopted":[147],"highlight":[149,178],"well":[154],"suppress":[156],"other":[157,237],"irrelevant":[158],"ones":[159],"spatial":[161],"graph":[162,189],"reasoning.":[163,190],"further":[170],"exploits":[171],"action":[172,185],"correct":[180],"matched":[182],"with":[183,235,251],"cues":[186],"temporal":[188],"addition":[192],"CMPC,":[195],"also":[197],"introduce":[198],"simple":[200],"yet":[201],"effective":[202],"Text-Guided":[203],"Feature":[204],"Exchange":[205],"(TGFE)":[206],"integrate":[209],"reasoned":[211],"multimodal":[212],"features":[213,232],"corresponding":[214],"different":[216],"levels":[217],"backbone":[221],"under":[222],"guidance":[224],"textual":[226,245],"information.":[227],"way,":[230],"multi-level":[231],"can":[233,253],"communicate":[234],"each":[236],"mutually":[240],"refined":[241],"context.":[246],"Combining":[247],"or":[249,257],"TGFE":[252],"form":[254],"version":[259],"frameworks":[262,265],"achieve":[266],"new":[267],"state-of-the-art":[268],"performances":[269],"four":[271],"benchmarks":[275,281],"three":[277],"respectively.":[282],"Our":[283],"code":[284],"available":[286],"at":[287],"https://github.com/spyflying/CMPC-Refseg.":[288]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":29},{"year":2024,"cited_by_count":35},{"year":2023,"cited_by_count":40},{"year":2022,"cited_by_count":15},{"year":2021,"cited_by_count":2}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
