{"id":"https://openalex.org/W3199130398","doi":"https://doi.org/10.1109/tmm.2021.3114541","title":"Bridging the Gap Between Semantic Segmentation and Instance Segmentation","display_name":"Bridging the Gap Between Semantic Segmentation and Instance Segmentation","publication_year":2021,"publication_date":"2021-09-22","ids":{"openalex":"https://openalex.org/W3199130398","doi":"https://doi.org/10.1109/tmm.2021.3114541","mag":"3199130398"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2021.3114541","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2021.3114541","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5031741238","display_name":"Chengxiang Yin","orcid":"https://orcid.org/0000-0002-3238-960X"},"institutions":[{"id":"https://openalex.org/I70983195","display_name":"Syracuse University","ror":"https://ror.org/025r5qe02","country_code":"US","type":"education","lineage":["https://openalex.org/I70983195"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Chengxiang Yin","raw_affiliation_strings":["Department of Electrical Engineering and Computer Science, Syracuse University, Syracuse, NY, U.S"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering and Computer Science, Syracuse University, Syracuse, NY, U.S","institution_ids":["https://openalex.org/I70983195"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039176528","display_name":"Jian Tang","orcid":"https://orcid.org/0000-0003-4418-0114"},"institutions":[{"id":"https://openalex.org/I4210093653","display_name":"Midea Group (China)","ror":"https://ror.org/006fm2278","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210093653"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jian Tang","raw_affiliation_strings":["Midea Group, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Midea Group, Shanghai, China","institution_ids":["https://openalex.org/I4210093653"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042100540","display_name":"Tongtong Yuan","orcid":"https://orcid.org/0000-0002-8224-9891"},"institutions":[{"id":"https://openalex.org/I37796252","display_name":"Beijing University of Technology","ror":"https://ror.org/037b1pp87","country_code":"CN","type":"education","lineage":["https://openalex.org/I37796252"]},{"id":"https://openalex.org/I70983195","display_name":"Syracuse University","ror":"https://ror.org/025r5qe02","country_code":"US","type":"education","lineage":["https://openalex.org/I70983195"]}],"countries":["CN","US"],"is_corresponding":false,"raw_author_name":"Tongtong Yuan","raw_affiliation_strings":["Beijing University of Technology, Beijing, China","Syracuse University, Syracuse, New York, United States"],"affiliations":[{"raw_affiliation_string":"Beijing University of Technology, Beijing, China","institution_ids":["https://openalex.org/I37796252"]},{"raw_affiliation_string":"Syracuse University, Syracuse, New York, United States","institution_ids":["https://openalex.org/I70983195"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047324704","display_name":"Zhiyuan Xu","orcid":"https://orcid.org/0000-0003-2879-3244"},"institutions":[{"id":"https://openalex.org/I4210093653","display_name":"Midea Group (China)","ror":"https://ror.org/006fm2278","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210093653"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiyuan Xu","raw_affiliation_strings":["Midea Group, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Midea Group, Shanghai, China","institution_ids":["https://openalex.org/I4210093653"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100651384","display_name":"Yanzhi Wang","orcid":"https://orcid.org/0000-0002-3024-7990"},"institutions":[{"id":"https://openalex.org/I12912129","display_name":"Northeastern University","ror":"https://ror.org/04t5xt781","country_code":"US","type":"education","lineage":["https://openalex.org/I12912129"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yanzhi Wang","raw_affiliation_strings":["Department of Electrical and Engineering, Northeastern University, Boston, MA, United States"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Engineering, Northeastern University, Boston, MA, United States","institution_ids":["https://openalex.org/I12912129"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5031741238"],"corresponding_institution_ids":["https://openalex.org/I70983195"],"apc_list":null,"apc_paid":null,"fwci":4.6623,"has_fulltext":false,"cited_by_count":79,"citation_normalized_percentile":{"value":0.96058397,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":"24","issue":null,"first_page":"4183","last_page":"4196"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.9887999892234802,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9883000254631042,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.86661696434021},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8319133520126343},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.70451420545578},{"id":"https://openalex.org/keywords/scale-space-segmentation","display_name":"Scale-space segmentation","score":0.5795040726661682},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5459876656532288},{"id":"https://openalex.org/keywords/segmentation-based-object-categorization","display_name":"Segmentation-based object categorization","score":0.5122596621513367},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4625707268714905},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.42729055881500244},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4161027669906616},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4034404158592224}],"concepts":[{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.86661696434021},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8319133520126343},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.70451420545578},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.5795040726661682},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5459876656532288},{"id":"https://openalex.org/C25694479","wikidata":"https://www.wikidata.org/wiki/Q7446278","display_name":"Segmentation-based object categorization","level":5,"score":0.5122596621513367},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4625707268714905},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.42729055881500244},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4161027669906616},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4034404158592224}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2021.3114541","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2021.3114541","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.75,"id":"https://metadata.un.org/sdg/11","display_name":"Sustainable cities and communities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":76,"referenced_works":["https://openalex.org/W845365781","https://openalex.org/W1861492603","https://openalex.org/W1903029394","https://openalex.org/W2117539524","https://openalex.org/W2125389028","https://openalex.org/W2216125271","https://openalex.org/W2319083191","https://openalex.org/W2322480645","https://openalex.org/W2331128040","https://openalex.org/W2340897893","https://openalex.org/W2555182955","https://openalex.org/W2557889580","https://openalex.org/W2558156561","https://openalex.org/W2560023338","https://openalex.org/W2593414223","https://openalex.org/W2594519801","https://openalex.org/W2595519089","https://openalex.org/W2605482930","https://openalex.org/W2608858501","https://openalex.org/W2630837129","https://openalex.org/W2742400085","https://openalex.org/W2744404335","https://openalex.org/W2777795072","https://openalex.org/W2787091153","https://openalex.org/W2809110088","https://openalex.org/W2888965908","https://openalex.org/W2890498246","https://openalex.org/W2894903065","https://openalex.org/W2902499724","https://openalex.org/W2956887593","https://openalex.org/W2962676885","https://openalex.org/W2963037989","https://openalex.org/W2963073614","https://openalex.org/W2963136578","https://openalex.org/W2963150697","https://openalex.org/W2963167763","https://openalex.org/W2963307106","https://openalex.org/W2963350373","https://openalex.org/W2963393688","https://openalex.org/W2963659353","https://openalex.org/W2963775509","https://openalex.org/W2963800363","https://openalex.org/W2963849369","https://openalex.org/W2963857746","https://openalex.org/W2964217532","https://openalex.org/W2964236837","https://openalex.org/W2964252655","https://openalex.org/W2965182628","https://openalex.org/W2981689412","https://openalex.org/W2982770724","https://openalex.org/W2993182889","https://openalex.org/W2999219213","https://openalex.org/W3034428102","https://openalex.org/W3035049382","https://openalex.org/W3099155473","https://openalex.org/W3106546328","https://openalex.org/W3106651317","https://openalex.org/W3121626821","https://openalex.org/W3122445164","https://openalex.org/W3196904463","https://openalex.org/W3214910576","https://openalex.org/W4214613769","https://openalex.org/W4293406525","https://openalex.org/W4293584584","https://openalex.org/W4295602020","https://openalex.org/W6631190155","https://openalex.org/W6678815747","https://openalex.org/W6684665197","https://openalex.org/W6717372056","https://openalex.org/W6739696289","https://openalex.org/W6750227808","https://openalex.org/W6751290860","https://openalex.org/W6754899465","https://openalex.org/W6756512664","https://openalex.org/W6757855356","https://openalex.org/W6789654255"],"related_works":["https://openalex.org/W1669643531","https://openalex.org/W1967061043","https://openalex.org/W2549936415","https://openalex.org/W2384989255","https://openalex.org/W2566648451","https://openalex.org/W1982826852","https://openalex.org/W2517104666","https://openalex.org/W134976887","https://openalex.org/W2274529912","https://openalex.org/W2021143974"],"abstract_inverted_index":{"Fine-grained":[0],"instance":[1,14,51,60,66,146],"segmentation":[2,15,49,52,72,122,143,153],"is":[3,29,91,131,154],"considerably":[4],"more":[5],"complicated":[6],"and":[7,50,84,97,148,168,178,196,208,222,224],"challenging":[8],"than":[9],"semantic":[10,48,71,121,142,152],"segmentation.":[11,187],"Most":[12],"existing":[13],"methods":[16],"only":[17],"focus":[18],"on":[19,93,191],"accuracy":[20],"without":[21],"paying":[22],"much":[23],"attention":[24],"to":[25,31,43,69,104,174,185,232],"inference":[26],"latency,":[27],"which,":[28],"critical":[30],"real-time":[32,57,128,214],"applications,":[33],"such":[34],"as":[35],"autonomous":[36],"driving.":[37],"In":[38],"this":[39],"paper,":[40],"we":[41],"aim":[42],"bridge":[44],"the":[45,112,150,192,212],"gap":[46],"between":[47],"by":[53,73],"presenting":[54],"a":[55,70,85,106,127],"novel":[56],"model":[58,144],"for":[59,145],"segmentation,":[61,147],"Sem2Ins,":[62,203],"which":[63],"effectively":[64],"generates":[65],"boundaries":[67],"according":[68],"leveraging":[74],"conditional":[75],"generative":[76],"adversarial":[77],"networks":[78],"(cGANs)":[79],"coupled":[80],"with":[81,118,140,206,228],"deep":[82,166],"supervision":[83,90,167],"weighted":[86,169],"fusion":[87,170],"layer.":[88],"Specifically,":[89],"imposed":[92],"each":[94],"output":[95],"layer,":[96],"features":[98],"from":[99],"different":[100],"levels":[101],"are":[102],"fused":[103],"produce":[105],"well-generated":[107],"boundary":[108],"map.":[109],"Sem2Ins":[110,124,137,157,180,226],"has":[111],"following":[113],"desirable":[114],"features:":[115],"1)":[116,202],"Combined":[117],"some":[119,233],"fast":[120],"methods,":[123],"runs":[125],"at":[126],"speed":[129,221],"that":[130,201],"fairly":[132],"well-balanced":[133],"against":[134],"accuracy;":[135,164,223],"2)":[136,225],"works":[138],"flexibly":[139],"any":[141],"if":[149],"given":[151],"sufficiently":[155],"good,":[156],"even":[158],"achieves":[159],"state-of-the-art":[160,213],"in":[161,217],"terms":[162,218],"of":[163,219],"3)":[165],"can":[171,181],"be":[172,182],"leveraged":[173],"generate":[175],"high-quality":[176],"boundaries;":[177],"4)":[179],"easily":[183],"extended":[184],"panoptic":[186],"Extensive":[188],"experiments":[189],"performed":[190],"Cityscapes,":[193],"WildDash,":[194],"KITTI":[195],"COCO":[197],"benchmarks":[198],"have":[199],"demonstrated":[200],"when":[204],"combined":[205,227],"PSPNet":[207],"DDRNet-23-Slim,":[209],"consistently":[210],"outperforms":[211],"solution":[215],"(Box2Pix)":[216],"both":[220],"DPC":[229],"performs":[230],"comparably":[231],"powerful":[234],"detect-and-segment":[235],"approaches.":[236]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":27},{"year":2024,"cited_by_count":33},{"year":2023,"cited_by_count":12},{"year":2022,"cited_by_count":3}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
