{"id":"https://openalex.org/W4416707046","doi":"https://doi.org/10.1109/tcsvt.2025.3637212","title":"SEMat: Semantic Enhanced Natural Image Interactive Matting","display_name":"SEMat: Semantic Enhanced Natural Image Interactive Matting","publication_year":2025,"publication_date":"2025-11-26","ids":{"openalex":"https://openalex.org/W4416707046","doi":"https://doi.org/10.1109/tcsvt.2025.3637212"},"language":null,"primary_location":{"id":"doi:10.1109/tcsvt.2025.3637212","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2025.3637212","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5080327203","display_name":"Ruihao Xia","orcid":"https://orcid.org/0009-0008-6749-5104"},"institutions":[{"id":"https://openalex.org/I143593769","display_name":"East China University of Science and Technology","ror":"https://ror.org/01vyrm377","country_code":"CN","type":"education","lineage":["https://openalex.org/I143593769"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ruihao Xia","raw_affiliation_strings":["Key Laboratory of Smart Manufacturing in Energy Chemical Process, Ministry of Education, East China University of Science and Technology, Shanghai, China","Ministry of Education, Key Laboratory of Smart Manufacturing in Energy Chemical Process, East China University of Science and Technology, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0008-6749-5104","affiliations":[{"raw_affiliation_string":"Key Laboratory of Smart Manufacturing in Energy Chemical Process, Ministry of Education, East China University of Science and Technology, Shanghai, China","institution_ids":["https://openalex.org/I143593769"]},{"raw_affiliation_string":"Ministry of Education, Key Laboratory of Smart Manufacturing in Energy Chemical Process, East China University of Science and Technology, Shanghai, China","institution_ids":["https://openalex.org/I143593769"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yu Liang","orcid":"https://orcid.org/0009-0005-3357-6529"},"institutions":[{"id":"https://openalex.org/I180662265","display_name":"China Mobile (China)","ror":"https://ror.org/05gftfe97","country_code":"CN","type":"company","lineage":["https://openalex.org/I180662265"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yu Liang","raw_affiliation_strings":["vivo Mobile Communication Company Ltd., Hangzhou, China","vivo Mobile Communication Co., Ltd., Hangzhou, China"],"raw_orcid":"https://orcid.org/0009-0005-3357-6529","affiliations":[{"raw_affiliation_string":"vivo Mobile Communication Company Ltd., Hangzhou, China","institution_ids":["https://openalex.org/I180662265"]},{"raw_affiliation_string":"vivo Mobile Communication Co., Ltd., Hangzhou, China","institution_ids":["https://openalex.org/I180662265"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062345781","display_name":"Peng-Tao Jiang","orcid":"https://orcid.org/0000-0002-1786-4943"},"institutions":[{"id":"https://openalex.org/I180662265","display_name":"China Mobile (China)","ror":"https://ror.org/05gftfe97","country_code":"CN","type":"company","lineage":["https://openalex.org/I180662265"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peng-Tao Jiang","raw_affiliation_strings":["vivo Mobile Communication Company Ltd., Hangzhou, China","vivo Mobile Communication Co., Ltd., Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-1786-4943","affiliations":[{"raw_affiliation_string":"vivo Mobile Communication Company Ltd., Hangzhou, China","institution_ids":["https://openalex.org/I180662265"]},{"raw_affiliation_string":"vivo Mobile Communication Co., Ltd., Hangzhou, China","institution_ids":["https://openalex.org/I180662265"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Hao Zhang","orcid":"https://orcid.org/0009-0007-1175-5918"},"institutions":[{"id":"https://openalex.org/I180662265","display_name":"China Mobile (China)","ror":"https://ror.org/05gftfe97","country_code":"CN","type":"company","lineage":["https://openalex.org/I180662265"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hao Zhang","raw_affiliation_strings":["vivo Mobile Communication Company Ltd., Hangzhou, China","vivo Mobile Communication Co., Ltd., Hangzhou, China"],"raw_orcid":"https://orcid.org/0009-0007-1175-5918","affiliations":[{"raw_affiliation_string":"vivo Mobile Communication Company Ltd., Hangzhou, China","institution_ids":["https://openalex.org/I180662265"]},{"raw_affiliation_string":"vivo Mobile Communication Co., Ltd., Hangzhou, China","institution_ids":["https://openalex.org/I180662265"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101633158","display_name":"Qianru Sun","orcid":"https://orcid.org/0000-0003-2689-317X"},"institutions":[{"id":"https://openalex.org/I79891267","display_name":"Singapore Management University","ror":"https://ror.org/050qmg959","country_code":"SG","type":"education","lineage":["https://openalex.org/I79891267"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Qianru Sun","raw_affiliation_strings":["Singapore Management University, Bras Basah, Singapore","Singapore Management University, Singapore"],"raw_orcid":"https://orcid.org/0000-0003-2689-317X","affiliations":[{"raw_affiliation_string":"Singapore Management University, Bras Basah, Singapore","institution_ids":["https://openalex.org/I79891267"]},{"raw_affiliation_string":"Singapore Management University, Singapore","institution_ids":["https://openalex.org/I79891267"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028570509","display_name":"Yang Tang","orcid":"https://orcid.org/0000-0002-2750-8029"},"institutions":[{"id":"https://openalex.org/I143593769","display_name":"East China University of Science and Technology","ror":"https://ror.org/01vyrm377","country_code":"CN","type":"education","lineage":["https://openalex.org/I143593769"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Tang","raw_affiliation_strings":["Key Laboratory of Smart Manufacturing in Energy Chemical Process, Ministry of Education, East China University of Science and Technology, Shanghai, China","Ministry of Education, Key Laboratory of Smart Manufacturing in Energy Chemical Process, East China University of Science and Technology, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-2750-8029","affiliations":[{"raw_affiliation_string":"Key Laboratory of Smart Manufacturing in Energy Chemical Process, Ministry of Education, East China University of Science and Technology, Shanghai, China","institution_ids":["https://openalex.org/I143593769"]},{"raw_affiliation_string":"Ministry of Education, Key Laboratory of Smart Manufacturing in Energy Chemical Process, East China University of Science and Technology, Shanghai, China","institution_ids":["https://openalex.org/I143593769"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100374366","display_name":"Bo Li","orcid":"https://orcid.org/0000-0001-7817-0665"},"institutions":[{"id":"https://openalex.org/I180662265","display_name":"China Mobile (China)","ror":"https://ror.org/05gftfe97","country_code":"CN","type":"company","lineage":["https://openalex.org/I180662265"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo Li","raw_affiliation_strings":["vivo Mobile Communication Company Ltd., Hangzhou, China","vivo Mobile Communication Co., Ltd., Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0001-7817-0665","affiliations":[{"raw_affiliation_string":"vivo Mobile Communication Company Ltd., Hangzhou, China","institution_ids":["https://openalex.org/I180662265"]},{"raw_affiliation_string":"vivo Mobile Communication Co., Ltd., Hangzhou, China","institution_ids":["https://openalex.org/I180662265"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010883708","display_name":"Pan Zhou","orcid":"https://orcid.org/0000-0003-3400-8943"},"institutions":[{"id":"https://openalex.org/I79891267","display_name":"Singapore Management University","ror":"https://ror.org/050qmg959","country_code":"SG","type":"education","lineage":["https://openalex.org/I79891267"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Pan Zhou","raw_affiliation_strings":["Singapore Management University, Bras Basah, Singapore","Singapore Management University, Singapore"],"raw_orcid":"https://orcid.org/0000-0003-3400-8943","affiliations":[{"raw_affiliation_string":"Singapore Management University, Bras Basah, Singapore","institution_ids":["https://openalex.org/I79891267"]},{"raw_affiliation_string":"Singapore Management University, Singapore","institution_ids":["https://openalex.org/I79891267"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5080327203"],"corresponding_institution_ids":["https://openalex.org/I143593769"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.35278887,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"36","issue":"4","first_page":"5329","last_page":"5343"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.9685999751091003,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.9685999751091003,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.007600000128149986,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.005400000140070915,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6601999998092651},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5235999822616577},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.46860000491142273},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4300999939441681},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.37779998779296875},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.3440000116825104},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.34119999408721924},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.3352000117301941}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8363999724388123},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6632999777793884},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6601999998092651},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5235999822616577},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.46860000491142273},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.46239998936653137},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4300999939441681},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.37779998779296875},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3440000116825104},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.34119999408721924},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.3352000117301941},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.32600000500679016},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.3197000026702881},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.3111000061035156},{"id":"https://openalex.org/C193415008","wikidata":"https://www.wikidata.org/wiki/Q639681","display_name":"Network architecture","level":2,"score":0.30979999899864197},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.3093999922275543},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3059000074863434},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.30000001192092896},{"id":"https://openalex.org/C2780233690","wikidata":"https://www.wikidata.org/wiki/Q535347","display_name":"Transparency (behavior)","level":2,"score":0.2915000021457672},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.2632000148296356},{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.2590999901294708},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.2578999996185303}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2025.3637212","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2025.3637212","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5884386629","display_name":null,"funder_award_id":"U2441245","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7221376959","display_name":null,"funder_award_id":"U25B6002","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7545332879","display_name":null,"funder_award_id":"62233005","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recent":[0],"approaches":[1],"attempt":[2],"to":[3,12,31,33,67,143,155,176,194],"adapt":[4],"powerful":[5],"interactive":[6,13,216],"segmentation":[7,65],"models,":[8],"such":[9],"as":[10],"SAM,":[11],"matting":[14,22,46,68,90,106,110,187],"and":[15,35,62,95,101,132,147,159,172,184],"fine-tune":[16],"the":[17,50,117,120,129,138,169,178,181,186,191,206],"models":[18,25],"based":[19,48],"on":[20,27,49],"synthetic":[21,28],"datasets.":[23],"However,":[24],"trained":[26],"data":[29],"fail":[30],"generalize":[32],"complex":[34,58,84],"occlusion":[36],"scenes.":[37],"We":[38],"address":[39],"this":[40],"challenge":[41],"by":[42,108],"proposing":[43],"a":[44,98,104],"new":[45],"dataset":[47],"COCO":[51,61],"dataset,":[52],"namely":[53],"COCO-Matting.":[54],"It":[55],"selects":[56],"real-world":[57],"images":[59],"from":[60,97,180,190],"converts":[63],"semantic":[64,197],"masks":[66,96,162],"labels.":[69],"The":[70,150],"built":[71],"COCO-Matting":[72],"comprises":[73],"an":[74],"extensive":[75],"collection":[76],"of":[77,119,209],"36,980":[78],"human":[79],"instance-level":[80],"alpha":[81],"mattes":[82],"in":[83,215],"natural":[85,217],"scenarios.":[86],"Furthermore,":[87],"existing":[88],"SAM-based":[89],"methods":[91],"extract":[92,144],"intermediate":[93],"features":[94],"frozen":[99],"SAM":[100],"only":[102],"train":[103],"lightweight":[105],"decoder":[107,153,193],"end-to-end":[109],"losses,":[111],"which":[112,127],"do":[113],"not":[114],"fully":[115],"exploit":[116],"potential":[118],"pre-trained":[121,182],"SAM.":[122],"Thus,":[123],"we":[124],"propose":[125],"SEMat":[126],"revamps":[128],"network":[130,136],"architecture":[131],"training":[133,167],"objectives.":[134],"For":[135,166],"architecture,":[137],"proposed":[139,151,170],"feature-aligned":[140],"transformer":[141],"learns":[142],"fine-grained":[145],"edge":[146],"transparency":[148],"features.":[149],"matte-aligned":[152],"aims":[154],"segment":[156],"matting-specific":[157],"objects":[158],"convert":[160],"coarse":[161],"into":[163],"high-precision":[164],"mattes.":[165],"objectives,":[168],"regularization":[171],"trimap":[173],"loss":[174],"aim":[175],"retain":[177],"prior":[179],"model":[183],"push":[185],"logits":[188],"extracted":[189],"mask":[192],"contain":[195],"trimap-based":[196],"information.":[198],"Extensive":[199],"experiments":[200],"across":[201],"seven":[202],"diverse":[203],"datasets":[204],"demonstrate":[205],"superior":[207],"performance":[208],"our":[210],"method,":[211],"proving":[212],"its":[213],"efficacy":[214],"image":[218],"matting.":[219],"Code":[220],"is":[221],"available":[222],"at":[223],"https://github.com/XiaRho/SEMat.":[224]},"counts_by_year":[],"updated_date":"2026-04-07T06:01:17.266235","created_date":"2025-11-27T00:00:00"}
