{"id":"https://openalex.org/W4389665127","doi":"https://doi.org/10.1109/tmm.2023.3342718","title":"Region-Enhanced Feature Learning for Scene Semantic Segmentation","display_name":"Region-Enhanced Feature Learning for Scene Semantic Segmentation","publication_year":2023,"publication_date":"2023-12-13","ids":{"openalex":"https://openalex.org/W4389665127","doi":"https://doi.org/10.1109/tmm.2023.3342718"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2023.3342718","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2023.3342718","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5116517434","display_name":"Xin Kang","orcid":"https://orcid.org/0000-0002-9975-4341"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xin Kang","raw_affiliation_strings":["National Engineering Laboratory for Brain-inspired Intelligence Technology and Application, University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Laboratory for Brain-inspired Intelligence Technology and Application, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115594845","display_name":"Chaoqun Wang","orcid":"https://orcid.org/0000-0002-4649-5518"},"institutions":[{"id":"https://openalex.org/I187400657","display_name":"South China Normal University","ror":"https://ror.org/01kq0pv72","country_code":"CN","type":"education","lineage":["https://openalex.org/I187400657"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chaoqun Wang","raw_affiliation_strings":["South China Normal University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"South China Normal University, Guangzhou, China","institution_ids":["https://openalex.org/I187400657"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088031350","display_name":"Xuejin Chen","orcid":"https://orcid.org/0000-0003-0478-7018"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuejin Chen","raw_affiliation_strings":["National Engineering Laboratory for Brain-inspired Intelligence Technology and Application, University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Laboratory for Brain-inspired Intelligence Technology and Application, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5116517434"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":1.5157,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.80257063,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"27","issue":null,"first_page":"954","last_page":"964"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11211","display_name":"3D Surveying and Cultural Heritage","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1907","display_name":"Geology"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8399039506912231},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6631014347076416},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6431734561920166},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.6071098446846008},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5832393169403076},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5386592745780945},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5172355771064758},{"id":"https://openalex.org/keywords/point-cloud","display_name":"Point cloud","score":0.46595650911331177},{"id":"https://openalex.org/keywords/pairwise-comparison","display_name":"Pairwise comparison","score":0.44339025020599365},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.43318843841552734},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.43085533380508423},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.4216083288192749}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8399039506912231},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6631014347076416},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6431734561920166},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.6071098446846008},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5832393169403076},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5386592745780945},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5172355771064758},{"id":"https://openalex.org/C131979681","wikidata":"https://www.wikidata.org/wiki/Q1899648","display_name":"Point cloud","level":2,"score":0.46595650911331177},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.44339025020599365},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.43318843841552734},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.43085533380508423},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.4216083288192749},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2023.3342718","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2023.3342718","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4000000059604645,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[{"id":"https://openalex.org/G42091576","display_name":null,"funder_award_id":"62076230","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G540665834","display_name":null,"funder_award_id":"WK3490000008","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320333993","display_name":"Microsoft Research Asia","ror":"https://ror.org/0300m5276"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W2131396337","https://openalex.org/W2135249503","https://openalex.org/W2160821342","https://openalex.org/W2460657278","https://openalex.org/W2594519801","https://openalex.org/W2620650400","https://openalex.org/W2624273542","https://openalex.org/W2737234477","https://openalex.org/W2804872164","https://openalex.org/W2955873422","https://openalex.org/W2963125977","https://openalex.org/W2963182550","https://openalex.org/W2963231572","https://openalex.org/W2963281829","https://openalex.org/W2979750740","https://openalex.org/W2990613095","https://openalex.org/W2991216808","https://openalex.org/W3012494314","https://openalex.org/W3034239841","https://openalex.org/W3034591723","https://openalex.org/W3043238202","https://openalex.org/W3089444959","https://openalex.org/W3104141662","https://openalex.org/W3107518100","https://openalex.org/W3111535274","https://openalex.org/W3131500599","https://openalex.org/W3138516171","https://openalex.org/W3153465022","https://openalex.org/W3168037706","https://openalex.org/W3171433839","https://openalex.org/W3203701986","https://openalex.org/W3205586691","https://openalex.org/W4214704440","https://openalex.org/W4214713996","https://openalex.org/W4214755140","https://openalex.org/W4226106508","https://openalex.org/W4287025408","https://openalex.org/W4312903973","https://openalex.org/W4313145913","https://openalex.org/W6739663239","https://openalex.org/W6739778489","https://openalex.org/W6763422710","https://openalex.org/W6784333009","https://openalex.org/W6810249204","https://openalex.org/W6839446344"],"related_works":["https://openalex.org/W2965546495","https://openalex.org/W4389116644","https://openalex.org/W2153315159","https://openalex.org/W3103844505","https://openalex.org/W259157601","https://openalex.org/W3119773509","https://openalex.org/W3208297503","https://openalex.org/W2889153461","https://openalex.org/W2964117661","https://openalex.org/W4388405611"],"abstract_inverted_index":{"Semantic":[0],"segmentation":[1,177,195],"in":[2,28],"complex":[3],"scenes":[4],"relies":[5],"not":[6],"only":[7],"on":[8,13,125,147,183,203,209],"object":[9,14],"appearance":[10],"but":[11],"also":[12],"location":[15],"and":[16,104,128,139,150,170,185,188,205,221,231],"the":[17,29,37,53,67,111,114,132,156,225],"surrounding":[18],"environment.":[19],"Nonetheless,":[20],"it":[21],"is":[22,168],"difficult":[23],"to":[24,36,65,83,159],"model":[25],"long-range":[26,227],"context":[27,228],"format":[30],"of":[31,56,60,98,122,235],"pairwise":[32],"point":[33,43,57,85,153],"correlations":[34,82],"due":[35],"huge":[38],"computational":[39,68,213],"cost":[40,214],"for":[41],"large-scale":[42],"clouds.":[44],"In":[45,110,131],"this":[46],"paper,":[47],"we":[48,135],"propose":[49],"using":[50],"regions":[51,123],"as":[52],"intermediate":[54],"representation":[55],"clouds":[58],"instead":[59],"fine-grained":[61],"points":[62,116],"or":[63],"voxels":[64],"reduce":[66],"burden.":[69],"We":[70,88,179],"introduce":[71],"a":[72,90,99,105,120,144],"novel":[73],"Region-Enhanced":[74],"Feature":[75],"Learning":[76],"Network":[77],"(REFL-Net)":[78],"that":[79],"leverages":[80],"region":[81,148,157],"enhance":[84],"feature":[86,92],"learning.":[87],"design":[89],"region-based":[91],"enhancement":[93],"(RFE)":[94],"module,":[95],"which":[96],"consists":[97],"Semantic-Spatial":[100],"Region":[101,106],"Extraction":[102],"stage":[103],"Dependency":[107],"Modeling":[108],"stage.":[109],"first":[112],"stage,":[113,134],"input":[115],"are":[117],"grouped":[118],"into":[119],"set":[121],"based":[124],"their":[126],"semantic":[127,138,176],"spatial":[129,140],"proximity.":[130],"second":[133],"explore":[136],"inter-region":[137],"relationships":[141],"by":[142],"employing":[143],"self-attention":[145],"block":[146],"features":[149,154,158],"then":[151],"fuse":[152],"with":[155,174,193,211,216],"obtain":[160],"more":[161],"discriminative":[162],"representations.":[163],"Our":[164,197],"proposed":[165],"RFE":[166,191],"module":[167,192],"plug-and-play":[169],"can":[171],"be":[172],"integrated":[173],"common":[175],"backbones.":[178,196],"conduct":[180],"extensive":[181],"experiments":[182],"ScanNetV2":[184,204],"S3DIS":[186,210],"datasets":[187],"evaluate":[189],"our":[190,236],"different":[194],"REFL-Net":[198],"achieves":[199],"1.8%":[200],"mIoU":[201,207],"gain":[202,208],"1.7%":[206],"negligible":[212],"compared":[215],"backbone":[217],"models.":[218],"Both":[219],"quantitative":[220],"qualitative":[222],"results":[223],"show":[224],"powerful":[226],"modeling":[229],"ability":[230,234],"strong":[232],"generalization":[233],"REFL-Net.":[237]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
