{"id":"https://openalex.org/W4392043723","doi":"https://doi.org/10.1007/s11063-024-11487-2","title":"Text-Vision Relationship Alignment for Referring Image Segmentation","display_name":"Text-Vision Relationship Alignment for Referring Image Segmentation","publication_year":2024,"publication_date":"2024-02-22","ids":{"openalex":"https://openalex.org/W4392043723","doi":"https://doi.org/10.1007/s11063-024-11487-2"},"language":"en","primary_location":{"id":"doi:10.1007/s11063-024-11487-2","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11063-024-11487-2","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11063-024-11487-2.pdf","source":{"id":"https://openalex.org/S140962798","display_name":"Neural Processing Letters","issn_l":"1370-4621","issn":["1370-4621","1573-773X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Processing Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s11063-024-11487-2.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108902955","display_name":"Mingxing Pu","orcid":null},"institutions":[{"id":"https://openalex.org/I102345215","display_name":"Xihua University","ror":"https://ror.org/04gwtvf26","country_code":"CN","type":"education","lineage":["https://openalex.org/I102345215"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Mingxing Pu","raw_affiliation_strings":["School of Computer and Software Engineering, Xihua University, Chengdu, 610039, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Software Engineering, Xihua University, Chengdu, 610039, China","institution_ids":["https://openalex.org/I102345215"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088687781","display_name":"Bing Luo","orcid":null},"institutions":[{"id":"https://openalex.org/I102345215","display_name":"Xihua University","ror":"https://ror.org/04gwtvf26","country_code":"CN","type":"education","lineage":["https://openalex.org/I102345215"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Bing Luo","raw_affiliation_strings":["School of Computer and Software Engineering, Xihua University, Chengdu, 610039, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Software Engineering, Xihua University, Chengdu, 610039, China","institution_ids":["https://openalex.org/I102345215"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100460297","display_name":"Chao Zhang","orcid":"https://orcid.org/0009-0007-2579-8783"},"institutions":[{"id":"https://openalex.org/I4210147983","display_name":"Guangdong Police College","ror":"https://ror.org/05krxyw16","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210147983"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chao Zhang","raw_affiliation_strings":["Key Laboratory of Intelligent Policing, Sichuan Police College, Luzhou, 646000, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Intelligent Policing, Sichuan Police College, Luzhou, 646000, China","institution_ids":["https://openalex.org/I4210147983"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101205115","display_name":"Li Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I102345215","display_name":"Xihua University","ror":"https://ror.org/04gwtvf26","country_code":"CN","type":"education","lineage":["https://openalex.org/I102345215"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Li Xu","raw_affiliation_strings":["School of Science, Xihua University, Chengdu, 610039, China"],"affiliations":[{"raw_affiliation_string":"School of Science, Xihua University, Chengdu, 610039, China","institution_ids":["https://openalex.org/I102345215"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101308077","display_name":"Fayou Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I102345215","display_name":"Xihua University","ror":"https://ror.org/04gwtvf26","country_code":"CN","type":"education","lineage":["https://openalex.org/I102345215"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Fayou Xu","raw_affiliation_strings":["School of Computer and Software Engineering, Xihua University, Chengdu, 610039, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Software Engineering, Xihua University, Chengdu, 610039, China","institution_ids":["https://openalex.org/I102345215"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5089779692","display_name":"Mingming Kong","orcid":"https://orcid.org/0000-0003-2869-5441"},"institutions":[{"id":"https://openalex.org/I102345215","display_name":"Xihua University","ror":"https://ror.org/04gwtvf26","country_code":"CN","type":"education","lineage":["https://openalex.org/I102345215"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Mingming Kong","raw_affiliation_strings":["School of Computer and Software Engineering, Xihua University, Chengdu, 610039, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Software Engineering, Xihua University, Chengdu, 610039, China","institution_ids":["https://openalex.org/I102345215"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5088687781","https://openalex.org/A5089779692","https://openalex.org/A5100460297","https://openalex.org/A5101205115","https://openalex.org/A5101308077","https://openalex.org/A5108902955"],"corresponding_institution_ids":["https://openalex.org/I102345215","https://openalex.org/I4210147983"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":0.4893,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.598435,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":"56","issue":"2","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computational-intelligence","display_name":"Computational intelligence","score":0.626477062702179},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5924681425094604},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.498882532119751},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.4926069378852844},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.48531144857406616},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.47693246603012085},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.47330939769744873},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3868541717529297}],"concepts":[{"id":"https://openalex.org/C139502532","wikidata":"https://www.wikidata.org/wiki/Q1122090","display_name":"Computational intelligence","level":2,"score":0.626477062702179},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5924681425094604},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.498882532119751},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.4926069378852844},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.48531144857406616},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.47693246603012085},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.47330939769744873},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3868541717529297}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s11063-024-11487-2","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11063-024-11487-2","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11063-024-11487-2.pdf","source":{"id":"https://openalex.org/S140962798","display_name":"Neural Processing Letters","issn_l":"1370-4621","issn":["1370-4621","1573-773X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Processing Letters","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s11063-024-11487-2","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11063-024-11487-2","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11063-024-11487-2.pdf","source":{"id":"https://openalex.org/S140962798","display_name":"Neural Processing Letters","issn_l":"1370-4621","issn":["1370-4621","1573-773X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Processing Letters","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.46000000834465027}],"awards":[{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6838816535","display_name":null,"funder_award_id":"61801398","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4392043723.pdf"},"referenced_works_count":45,"referenced_works":["https://openalex.org/W2031489346","https://openalex.org/W2064675550","https://openalex.org/W2123442489","https://openalex.org/W2194775991","https://openalex.org/W2250539671","https://openalex.org/W2251512949","https://openalex.org/W2302548814","https://openalex.org/W2412782625","https://openalex.org/W2489434015","https://openalex.org/W2605127024","https://openalex.org/W2798556392","https://openalex.org/W2806070179","https://openalex.org/W2876852810","https://openalex.org/W2894964039","https://openalex.org/W2962739339","https://openalex.org/W2963109634","https://openalex.org/W2963145877","https://openalex.org/W2964345792","https://openalex.org/W2973233205","https://openalex.org/W2980088508","https://openalex.org/W2984121207","https://openalex.org/W3003423830","https://openalex.org/W3023463084","https://openalex.org/W3035097537","https://openalex.org/W3099166112","https://openalex.org/W3108748824","https://openalex.org/W3122412340","https://openalex.org/W3138516171","https://openalex.org/W3153666347","https://openalex.org/W3156800342","https://openalex.org/W3169998662","https://openalex.org/W3172522282","https://openalex.org/W3201770677","https://openalex.org/W3206209177","https://openalex.org/W3216551675","https://openalex.org/W4200631575","https://openalex.org/W4224988000","https://openalex.org/W4225495512","https://openalex.org/W4312438304","https://openalex.org/W4312543911","https://openalex.org/W4312981390","https://openalex.org/W4313023122","https://openalex.org/W6600002382","https://openalex.org/W6600228653","https://openalex.org/W6600756316"],"related_works":["https://openalex.org/W2736674626","https://openalex.org/W2973875853","https://openalex.org/W4379231730","https://openalex.org/W4389858081","https://openalex.org/W4324315429","https://openalex.org/W2501551404","https://openalex.org/W4385583601","https://openalex.org/W4298131179","https://openalex.org/W2113201962","https://openalex.org/W1522196789"],"abstract_inverted_index":{"Abstract":[0],"Referring":[1],"image":[2,10,60,139,190],"segmentation":[3,61,191],"aims":[4],"to":[5,140,163],"segment":[6],"object":[7],"in":[8,19,105],"an":[9,55],"based":[11,29,118],"on":[12,30,74,119,187],"a":[13,106],"referring":[14,59,189],"expression.":[15],"Its":[16],"difficulty":[17],"lies":[18],"aligning":[20,63],"expression":[21,79,85],"semantics":[22],"with":[23,66,159,184],"visual":[24,50,116,147,151,157],"instances.":[25,51],"The":[26,170],"existing":[27],"methods":[28],"semantic":[31],"reasoning":[32],"are":[33],"limited":[34],"by":[35,62,99,180],"the":[36,47,84,100,120,126,138,146,156,160,167,175],"performance":[37,179],"of":[38,137],"external":[39,75],"syntax":[40,76],"parser":[41,77],"and":[42,88,96,122,153],"do":[43],"not":[44,72],"explicitly":[45],"explore":[46],"relationships":[48,148,158,162],"between":[49,149],"This":[52,69],"article":[53],"proposes":[54],"end-to-end":[56],"method":[57,70,177,186],"for":[58,78],"\u2019linguistic":[64,97],"relationship\u2019":[65,98],"\u2019visual":[67],"relationships\u2019.":[68],"does":[71],"rely":[73],"parsing.":[80],"In":[81,124],"this":[82],"paper,":[83],"is":[86],"adaptively":[87],"structurally":[89],"parsed":[90],"into":[91],"three":[92],"components:":[93],"\u2019subject\u2019,":[94],"\u2019object\u2019,":[95],"Semantic":[101],"Component":[102],"Parser":[103],"(SCP)":[104],"learnable":[107],"manner.":[108],"Instances":[109],"Activation":[110],"Map":[111],"Module":[112,131],"(IAM)":[113],"locates":[114],"multiple":[115,188],"instances":[117],"subject":[121],"object.":[123,169],"addition,":[125],"Relationship":[127],"Based":[128],"Visual":[129],"Localization":[130],"(RBVL)":[132],"firstly":[133],"enables":[134],"each":[135],"instance":[136],"learn":[141],"global":[142],"knowledge,":[143],"then":[144],"decodes":[145],"these":[150],"instances,":[152],"finally":[154],"aligns":[155],"linguistic":[161],"further":[164],"accurately":[165],"locate":[166],"target":[168],"experimental":[171],"results":[172],"show":[173],"that":[174],"proposed":[176],"improves":[178],"4\u2013":[181],"9%":[182],"compared":[183],"baseline":[185],"datasets.":[192]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
