{"id":"https://openalex.org/W3206209177","doi":"https://doi.org/10.1145/3474085.3475222","title":"Two-stage Visual Cues Enhancement Network for Referring Image Segmentation","display_name":"Two-stage Visual Cues Enhancement Network for Referring Image Segmentation","publication_year":2021,"publication_date":"2021-10-17","ids":{"openalex":"https://openalex.org/W3206209177","doi":"https://doi.org/10.1145/3474085.3475222","mag":"3206209177"},"language":"en","primary_location":{"id":"doi:10.1145/3474085.3475222","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3474085.3475222","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010965630","display_name":"Yang Jiao","orcid":"https://orcid.org/0000-0002-6390-2517"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yang Jiao","raw_affiliation_strings":["Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075329194","display_name":"Zequn Jie","orcid":"https://orcid.org/0000-0002-3038-5891"},"institutions":[{"id":"https://openalex.org/I4210087373","display_name":"Meizu (China)","ror":"https://ror.org/0067g4302","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210087373"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zequn Jie","raw_affiliation_strings":["Meituan, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Meituan, Beijing, China","institution_ids":["https://openalex.org/I4210087373"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013605789","display_name":"Weixin Luo","orcid":null},"institutions":[{"id":"https://openalex.org/I4210087373","display_name":"Meizu (China)","ror":"https://ror.org/0067g4302","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210087373"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weixin Luo","raw_affiliation_strings":["Meituan, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Meituan, Beijing, China","institution_ids":["https://openalex.org/I4210087373"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100373492","display_name":"Jingjing Chen","orcid":"https://orcid.org/0000-0003-3148-264X"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingjing Chen","raw_affiliation_strings":["Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047962986","display_name":"Yu\u2013Gang Jiang","orcid":"https://orcid.org/0000-0002-1907-8567"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yu-Gang Jiang","raw_affiliation_strings":["Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009222019","display_name":"Xiaolin Wei","orcid":"https://orcid.org/0000-0002-3983-047X"},"institutions":[{"id":"https://openalex.org/I4210087373","display_name":"Meizu (China)","ror":"https://ror.org/0067g4302","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210087373"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaolin Wei","raw_affiliation_strings":["Meituan, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Meituan, Beijing, China","institution_ids":["https://openalex.org/I4210087373"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017116858","display_name":"Lin Ma","orcid":"https://orcid.org/0000-0002-7331-6132"},"institutions":[{"id":"https://openalex.org/I4210087373","display_name":"Meizu (China)","ror":"https://ror.org/0067g4302","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210087373"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lin Ma","raw_affiliation_strings":["Meituan, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Meituan, Beijing, China","institution_ids":["https://openalex.org/I4210087373"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5010965630"],"corresponding_institution_ids":["https://openalex.org/I24943067"],"apc_list":null,"apc_paid":null,"fwci":2.0174,"has_fulltext":false,"cited_by_count":22,"citation_normalized_percentile":{"value":0.88792484,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1331","last_page":"1340"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.758673906326294},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6990865468978882},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6140444278717041},{"id":"https://openalex.org/keywords/sensory-cue","display_name":"Sensory cue","score":0.5802468061447144},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5572959780693054},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.5273333787918091},{"id":"https://openalex.org/keywords/referent","display_name":"Referent","score":0.5104891061782837},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.4738624095916748},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.42203468084335327},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09509235620498657}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.758673906326294},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6990865468978882},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6140444278717041},{"id":"https://openalex.org/C111370547","wikidata":"https://www.wikidata.org/wiki/Q7451120","display_name":"Sensory cue","level":2,"score":0.5802468061447144},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5572959780693054},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.5273333787918091},{"id":"https://openalex.org/C2777096784","wikidata":"https://www.wikidata.org/wiki/Q3826351","display_name":"Referent","level":2,"score":0.5104891061782837},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.4738624095916748},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.42203468084335327},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09509235620498657},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3474085.3475222","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3474085.3475222","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7599999904632568,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W1566289585","https://openalex.org/W2006147162","https://openalex.org/W2031489346","https://openalex.org/W2108598243","https://openalex.org/W2250539671","https://openalex.org/W2250861254","https://openalex.org/W2302548814","https://openalex.org/W2412782625","https://openalex.org/W2546696630","https://openalex.org/W2605127024","https://openalex.org/W2747329762","https://openalex.org/W2798556392","https://openalex.org/W2799142693","https://openalex.org/W2876852810","https://openalex.org/W2894964039","https://openalex.org/W2955058313","https://openalex.org/W2963091558","https://openalex.org/W2963109634","https://openalex.org/W2963244312","https://openalex.org/W2963857746","https://openalex.org/W2980088508","https://openalex.org/W2981689412","https://openalex.org/W3004019157","https://openalex.org/W3034325957","https://openalex.org/W3034692043","https://openalex.org/W3035733952","https://openalex.org/W3093122931"],"related_works":["https://openalex.org/W2143938773","https://openalex.org/W2366781357","https://openalex.org/W2493878481","https://openalex.org/W1968508462","https://openalex.org/W2167817468","https://openalex.org/W2087916438","https://openalex.org/W4231483347","https://openalex.org/W3010781847","https://openalex.org/W2019550078","https://openalex.org/W4318215341"],"abstract_inverted_index":{"Referring":[0],"Image":[1],"Segmentation":[2],"(RIS)":[3],"aims":[4],"at":[5,90],"segmenting":[6],"the":[7,30,33,65,76,99,102,112,133,137,169,182,190,194,197,208,214,223,226,241,249,253,268,271,275,283],"target":[8],"object":[9],"from":[10,127,173,218],"an":[11,157,174],"image":[12,172,199],"referred":[13,71],"by":[14,87,95,111,139,212],"one":[15],"given":[16],"natural":[17,242],"language":[18,243],"expression.":[19],"The":[20],"diverse":[21],"and":[22,25,48,62,152,156,184,187,245],"flexible":[23],"expressions":[24,47],"complex":[26],"visual":[27,66,80,104,134,183,191,209,250],"contents":[28],"in":[29,46,51,98,118,235],"images":[31],"raise":[32],"RIS":[34,276],"model":[35],"with":[36,178,196,278],"higher":[37],"demands":[38],"for":[39,136,200],"investigating":[40],"fine-grained":[41,237],"matching":[42,55,238],"behaviors":[43,56,239],"between":[44,240],"words":[45],"objects":[49,97],"presented":[50],"images.":[52],"However,":[53],"such":[54],"are":[57,73,164,264],"hard":[58],"to":[59,83,180,266],"be":[60,84,109],"learned":[61],"captured":[63],"when":[64,248],"cues":[67,81,105,144],"of":[68,78,131,193,222,252,270],"referents":[69,77,138],"(i.e.":[70],"objects)":[72],"insufficient,":[74],"as":[75,116],"weak":[79],"tend":[82],"easily":[85],"confused":[86],"cluttered":[88],"background":[89],"boundary":[91],"or":[92],"even":[93],"overwhelmed":[94],"salient":[96],"image.":[100,224],"And":[101],"insufficient":[103],"issue":[106],"can":[107],"not":[108],"handled":[110],"cross-modal":[113],"fusion":[114],"mechanisms":[115],"done":[117],"previous":[119],"work.In":[120],"this":[121,125],"paper,":[122],"we":[123],"tackle":[124],"problem":[126],"a":[128,141,149],"novel":[129,150],"perspective":[130],"enhancing":[132],"information":[135,192,211,251],"devising":[140],"Two-stage":[142],"Visual":[143],"enhancement":[145],"Network":[146],"(TV-Net),":[147],"where":[148],"Retrieval":[151],"Enrichment":[153],"Scheme":[154],"(RES)":[155],"Adaptive":[158],"Multi-resolution":[159],"feature":[160,203,216],"Fusion":[161],"(AMF)":[162],"module":[163],"proposed.":[165],"Specifically,":[166],"RES":[167],"retrieves":[168],"most":[170],"relevant":[171],"external":[175],"data":[176],"pool":[177],"regard":[179],"both":[181],"textual":[185],"similarities,":[186],"then":[188],"enriches":[189],"referent":[195,254],"retrieved":[198],"better":[201,233,259],"multimodal":[202],"learning.":[204],"AMF":[205],"further":[206],"enhances":[207],"detailed":[210],"incorporating":[213],"high-resolution":[215],"maps":[217],"lower":[219],"convolution":[220],"layers":[221],"Through":[225],"two-stage":[227],"enhancement,":[228],"our":[229,279],"proposed":[230,272,280],"TV-Net":[231,281],"enjoys":[232],"performances":[234],"learning":[236],"expression":[244],"image,":[246],"especially":[247],"is":[255],"inadequate,":[256],"thus":[257],"produces":[258],"segmentation":[260],"results.":[261],"Extensive":[262],"experiments":[263],"conducted":[265],"validate":[267],"effectiveness":[269],"method":[273],"on":[274,286],"task,":[277],"surpassing":[282],"state-of-the-art":[284],"approaches":[285],"four":[287],"benchmark":[288],"datasets.":[289]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":6}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
