{"id":"https://openalex.org/W4389041252","doi":"https://doi.org/10.1109/csit61576.2023.10324276","title":"Transforming Semantic Segmentation into Instance Segmentation with a Guided U-Net","display_name":"Transforming Semantic Segmentation into Instance Segmentation with a Guided U-Net","publication_year":2023,"publication_date":"2023-10-19","ids":{"openalex":"https://openalex.org/W4389041252","doi":"https://doi.org/10.1109/csit61576.2023.10324276"},"language":"en","primary_location":{"id":"doi:10.1109/csit61576.2023.10324276","is_oa":false,"landing_page_url":"https://doi.org/10.1109/csit61576.2023.10324276","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 18th International Conference on Computer Science and Information Technologies (CSIT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5092373483","display_name":"Roman Lavrynenko","orcid":"https://orcid.org/0000-0003-1969-1107"},"institutions":[{"id":"https://openalex.org/I107158390","display_name":"Kharkiv National University of Radio Electronics","ror":"https://ror.org/01ctj1b90","country_code":"UA","type":"education","lineage":["https://openalex.org/I107158390"]},{"id":"https://openalex.org/I8765205","display_name":"V. N. Karazin Kharkiv National University","ror":"https://ror.org/03ftejk10","country_code":"UA","type":"education","lineage":["https://openalex.org/I8765205"]}],"countries":["UA"],"is_corresponding":true,"raw_author_name":"Roman Lavrynenko","raw_affiliation_strings":["Kharkiv National University of Radio Electronics,Artificial Intelligence department,Kharkiv,Ukraine"],"affiliations":[{"raw_affiliation_string":"Kharkiv National University of Radio Electronics,Artificial Intelligence department,Kharkiv,Ukraine","institution_ids":["https://openalex.org/I8765205","https://openalex.org/I107158390"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5072662545","display_name":"Nataliya Ryabova","orcid":"https://orcid.org/0000-0002-3608-6163"},"institutions":[{"id":"https://openalex.org/I8765205","display_name":"V. N. Karazin Kharkiv National University","ror":"https://ror.org/03ftejk10","country_code":"UA","type":"education","lineage":["https://openalex.org/I8765205"]},{"id":"https://openalex.org/I107158390","display_name":"Kharkiv National University of Radio Electronics","ror":"https://ror.org/01ctj1b90","country_code":"UA","type":"education","lineage":["https://openalex.org/I107158390"]}],"countries":["UA"],"is_corresponding":false,"raw_author_name":"Nataliya Ryabova","raw_affiliation_strings":["Kharkiv National University of Radio Electronics,Artificial Intelligence department,Kharkiv,Ukraine"],"affiliations":[{"raw_affiliation_string":"Kharkiv National University of Radio Electronics,Artificial Intelligence department,Kharkiv,Ukraine","institution_ids":["https://openalex.org/I8765205","https://openalex.org/I107158390"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5092373483"],"corresponding_institution_ids":["https://openalex.org/I107158390","https://openalex.org/I8765205"],"apc_list":null,"apc_paid":null,"fwci":0.3704,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.61329021,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12549","display_name":"Image and Object Detection Techniques","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.8744634389877319},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7413149476051331},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.641276478767395},{"id":"https://openalex.org/keywords/scale-space-segmentation","display_name":"Scale-space segmentation","score":0.6032639145851135},{"id":"https://openalex.org/keywords/segmentation-based-object-categorization","display_name":"Segmentation-based object categorization","score":0.5749828815460205},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.5551620125770569},{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.5144565105438232},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.4945509135723114},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4456685483455658},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.44489872455596924},{"id":"https://openalex.org/keywords/contrast","display_name":"Contrast (vision)","score":0.4360877275466919},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.433454692363739},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3855486214160919}],"concepts":[{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.8744634389877319},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7413149476051331},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.641276478767395},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.6032639145851135},{"id":"https://openalex.org/C25694479","wikidata":"https://www.wikidata.org/wiki/Q7446278","display_name":"Segmentation-based object categorization","level":5,"score":0.5749828815460205},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.5551620125770569},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.5144565105438232},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4945509135723114},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4456685483455658},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.44489872455596924},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.4360877275466919},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.433454692363739},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3855486214160919},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/csit61576.2023.10324276","is_oa":false,"landing_page_url":"https://doi.org/10.1109/csit61576.2023.10324276","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE 18th International Conference on Computer Science and Information Technologies (CSIT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.4300000071525574,"id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W2557889580","https://openalex.org/W2884822772","https://openalex.org/W2911034023","https://openalex.org/W2911495555","https://openalex.org/W2963150697","https://openalex.org/W3184439416","https://openalex.org/W4312781473","https://openalex.org/W6752558437","https://openalex.org/W6798838024"],"related_works":["https://openalex.org/W3144569342","https://openalex.org/W2945274617","https://openalex.org/W2185902295","https://openalex.org/W2103507220","https://openalex.org/W2055202857","https://openalex.org/W2371519352","https://openalex.org/W4205800335","https://openalex.org/W2386644571","https://openalex.org/W2372421320","https://openalex.org/W2551987074"],"abstract_inverted_index":{"Traditional":[0],"approaches":[1],"to":[2,39,62,69,148],"instance":[3,31,41],"segmentation":[4,24,42,50,99,172],"typically":[5],"rely":[6,152],"on":[7,141,153],"the":[8,14,27,45,48,79,82,94,97,102,106,123,127,178],"utilization":[9],"of":[10,47,72,81,92],"object":[11],"detectors":[12],"in":[13,146,166],"initial":[15],"phase.":[16,51],"In":[17],"contrast,":[18],"our":[19,138],"approach":[20,139],"leverages":[21],"a":[22,35,58,63,66,90,110,120,132,142,169],"semantic":[23,49,98,171],"model":[25,173],"as":[26],"foundational":[28],"stage":[29],"for":[30,180],"segmentation.":[32],"We":[33],"introduce":[34],"novel":[36],"\u201cGuided":[37],"U-Net\u201d":[38],"extract":[40],"masks":[43],"from":[44,101],"output":[46,100],"Inspired":[52],"by":[53],"educational":[54],"strategies,":[55],"we":[56],"incorporate":[57],"\u201cguide\u201d":[59],"mechanism":[60],"akin":[61],"teacher":[64],"directing":[65],"student\u2019s":[67],"attention":[68],"specific":[70],"regions":[71],"an":[73,117],"image":[74],"and":[75,105,126,177],"prompting":[76],"inquiries":[77],"about":[78],"boundaries":[80],"indicated":[83],"instance.The":[84],"Guided":[85],"U-Net":[86],"is":[87,135,174],"trained":[88],"using":[89],"triad":[91],"inputs:":[93],"original":[95],"image,":[96],"primary":[103],"stage,":[104],"guide\u2014a":[107],"matrix":[108],"containing":[109],"single":[111],"white":[112],"dot":[113],"placed":[114],"randomly":[115],"within":[116],"instance.":[118],"Through":[119],"comparison":[121],"between":[122],"predicted":[124],"mask":[125],"corresponding":[128],"ground":[129],"truth":[130],"mask,":[131],"loss":[133,144,155],"value":[134],"computed.":[136],"Remarkably,":[137],"capitalizes":[140],"straightforward":[143],"function,":[145],"contrast":[147],"contemporary":[149],"models":[150],"that":[151],"intricate":[154],"functions":[156],"requiring":[157],"weight":[158],"tuning.":[159],"The":[160],"proposed":[161],"method":[162],"shows":[163],"promise,":[164],"particularly":[165],"scenarios":[167],"where":[168],"well-trained":[170],"already":[175],"available":[176],"need":[179],"instance-level":[181],"detail":[182],"arises.":[183]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
