{"id":"https://openalex.org/W4362654014","doi":"https://doi.org/10.1109/tmm.2023.3264883","title":"A Unified Transformer Framework for Group-Based Segmentation: Co-Segmentation, Co-Saliency Detection and Video Salient Object Detection","display_name":"A Unified Transformer Framework for Group-Based Segmentation: Co-Segmentation, Co-Saliency Detection and Video Salient Object Detection","publication_year":2023,"publication_date":"2023-04-05","ids":{"openalex":"https://openalex.org/W4362654014","doi":"https://doi.org/10.1109/tmm.2023.3264883"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2023.3264883","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2023.3264883","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5003812660","display_name":"Yukun Su","orcid":"https://orcid.org/0000-0001-6942-3528"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yukun Su","raw_affiliation_strings":["School of Software Engineering, Key Laboratory of Big Data and Intelligent Robot, Ministry of Education, South China University of Technology, Guangzhou, China"],"raw_orcid":"https://orcid.org/0000-0001-6942-3528","affiliations":[{"raw_affiliation_string":"School of Software Engineering, Key Laboratory of Big Data and Intelligent Robot, Ministry of Education, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083709004","display_name":"Jingliang Deng","orcid":null},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingliang Deng","raw_affiliation_strings":["School of Software Engineering, Key Laboratory of Big Data and Intelligent Robot, Ministry of Education, South China University of Technology, Guangzhou, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Software Engineering, Key Laboratory of Big Data and Intelligent Robot, Ministry of Education, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029998379","display_name":"Ruizhou Sun","orcid":null},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruizhou Sun","raw_affiliation_strings":["School of Software Engineering, Key Laboratory of Big Data and Intelligent Robot, Ministry of Education, South China University of Technology, Guangzhou, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Software Engineering, Key Laboratory of Big Data and Intelligent Robot, Ministry of Education, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029912845","display_name":"Guosheng Lin","orcid":"https://orcid.org/0000-0002-0329-7458"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Guosheng Lin","raw_affiliation_strings":["School of Computer Science and Engineering, Nanyang Technological University, Singapore"],"raw_orcid":"https://orcid.org/0000-0002-0329-7458","affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076885058","display_name":"Hanjing Su","orcid":"https://orcid.org/0000-0003-3317-2303"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hanjing Su","raw_affiliation_strings":["Tencent, Shenzhen, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Tencent, Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5023130798","display_name":"Qingyao Wu","orcid":"https://orcid.org/0000-0002-6771-3932"},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qingyao Wu","raw_affiliation_strings":["School of Software Engineering, Pazhou Lab, South China University, Guangzhou, China","Peng Cheng Laboratory, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0002-6771-3932","affiliations":[{"raw_affiliation_string":"School of Software Engineering, Pazhou Lab, South China University, Guangzhou, China","institution_ids":[]},{"raw_affiliation_string":"Peng Cheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5003812660"],"corresponding_institution_ids":["https://openalex.org/I90610280"],"apc_list":null,"apc_paid":null,"fwci":14.1513,"has_fulltext":false,"cited_by_count":126,"citation_normalized_percentile":{"value":0.99345596,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":"26","issue":null,"first_page":"313","last_page":"325"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.9909999966621399,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9905999898910522,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8436518907546997},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5984907150268555},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5883757472038269},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5851807594299316},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.5076745748519897},{"id":"https://openalex.org/keywords/pascal","display_name":"Pascal (unit)","score":0.45953062176704407},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.4486079216003418},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.43373245000839233},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.42878013849258423},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3316307067871094},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.10399094223976135},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.09525135159492493}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8436518907546997},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5984907150268555},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5883757472038269},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5851807594299316},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.5076745748519897},{"id":"https://openalex.org/C75608658","wikidata":"https://www.wikidata.org/wiki/Q44395","display_name":"Pascal (unit)","level":2,"score":0.45953062176704407},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.4486079216003418},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.43373245000839233},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.42878013849258423},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3316307067871094},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.10399094223976135},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.09525135159492493}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2023.3264883","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2023.3264883","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2048204237","display_name":null,"funder_award_id":"62272172","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3220463999","display_name":null,"funder_award_id":"AISG-RP-2018-003","funder_id":"https://openalex.org/F4320320709","funder_display_name":"National Research Foundation Singapore"},{"id":"https://openalex.org/G5695494393","display_name":null,"funder_award_id":"2023A1515012920","funder_id":"https://openalex.org/F4320337111","funder_display_name":"Basic and Applied Basic Research Foundation of Guangdong Province"},{"id":"https://openalex.org/G8183260716","display_name":null,"funder_award_id":"2019TQ05X200","funder_id":"https://openalex.org/F4320327806","funder_display_name":"Tip-top Scientific and Technical Innovative Youth Talents of Guangdong Special Support Program"}],"funders":[{"id":"https://openalex.org/F4320320709","display_name":"National Research Foundation Singapore","ror":"https://ror.org/03cpyc314"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320327806","display_name":"Tip-top Scientific and Technical Innovative Youth Talents of Guangdong Special Support Program","ror":null},{"id":"https://openalex.org/F4320337111","display_name":"Basic and Applied Basic Research Foundation of Guangdong Province","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":112,"referenced_works":["https://openalex.org/W21025885","https://openalex.org/W1522301498","https://openalex.org/W1522734439","https://openalex.org/W1528789833","https://openalex.org/W1686810756","https://openalex.org/W1797268635","https://openalex.org/W1861492603","https://openalex.org/W1914179642","https://openalex.org/W1964884769","https://openalex.org/W1966601141","https://openalex.org/W1970958500","https://openalex.org/W1982075130","https://openalex.org/W1986811142","https://openalex.org/W1992992668","https://openalex.org/W1996140089","https://openalex.org/W1996326832","https://openalex.org/W2037227137","https://openalex.org/W2064675550","https://openalex.org/W2076756823","https://openalex.org/W2100470808","https://openalex.org/W2110019070","https://openalex.org/W2118802082","https://openalex.org/W2132914434","https://openalex.org/W2138682569","https://openalex.org/W2143668817","https://openalex.org/W2157244733","https://openalex.org/W2194775991","https://openalex.org/W2293332611","https://openalex.org/W2295107390","https://openalex.org/W2412782625","https://openalex.org/W2415053570","https://openalex.org/W2470139095","https://openalex.org/W2474265885","https://openalex.org/W2518666399","https://openalex.org/W2529603763","https://openalex.org/W2560474170","https://openalex.org/W2565639579","https://openalex.org/W2585592883","https://openalex.org/W2740667773","https://openalex.org/W2747199123","https://openalex.org/W2750988638","https://openalex.org/W2787091153","https://openalex.org/W2793029440","https://openalex.org/W2800632947","https://openalex.org/W2807912089","https://openalex.org/W2889986507","https://openalex.org/W2894890793","https://openalex.org/W2895340898","https://openalex.org/W2896011443","https://openalex.org/W2904945062","https://openalex.org/W2916743882","https://openalex.org/W2916798096","https://openalex.org/W2939217524","https://openalex.org/W2942939335","https://openalex.org/W2943125866","https://openalex.org/W2948937967","https://openalex.org/W2955084925","https://openalex.org/W2961348656","https://openalex.org/W2962974533","https://openalex.org/W2963091558","https://openalex.org/W2963529609","https://openalex.org/W2963868681","https://openalex.org/W2964283970","https://openalex.org/W2964429685","https://openalex.org/W2965638232","https://openalex.org/W2969626490","https://openalex.org/W2972640707","https://openalex.org/W2981680738","https://openalex.org/W2981723426","https://openalex.org/W2982083293","https://openalex.org/W2984144959","https://openalex.org/W2986056979","https://openalex.org/W2987391422","https://openalex.org/W2987701848","https://openalex.org/W2990844506","https://openalex.org/W2990984982","https://openalex.org/W2997217064","https://openalex.org/W2997788879","https://openalex.org/W3012255272","https://openalex.org/W3012573144","https://openalex.org/W3016163669","https://openalex.org/W3018757597","https://openalex.org/W3035242260","https://openalex.org/W3035666869","https://openalex.org/W3039991645","https://openalex.org/W3044364325","https://openalex.org/W3047057232","https://openalex.org/W3096289386","https://openalex.org/W3108043693","https://openalex.org/W3108981297","https://openalex.org/W3119667975","https://openalex.org/W3127947687","https://openalex.org/W3172675153","https://openalex.org/W3173349970","https://openalex.org/W3174178235","https://openalex.org/W3201844719","https://openalex.org/W3202242435","https://openalex.org/W3202424564","https://openalex.org/W3203879378","https://openalex.org/W3216044769","https://openalex.org/W4214542306","https://openalex.org/W4225986700","https://openalex.org/W4287684771","https://openalex.org/W6631190155","https://openalex.org/W6637373629","https://openalex.org/W6638319203","https://openalex.org/W6759534164","https://openalex.org/W6763422710","https://openalex.org/W6777046832","https://openalex.org/W6780226713","https://openalex.org/W6782657842","https://openalex.org/W6803376173"],"related_works":["https://openalex.org/W4376620596","https://openalex.org/W3177249605","https://openalex.org/W2534152068","https://openalex.org/W4299545679","https://openalex.org/W3138508047","https://openalex.org/W1972515067","https://openalex.org/W1689909837","https://openalex.org/W4293054914","https://openalex.org/W4313315626","https://openalex.org/W2963418361"],"abstract_inverted_index":{"Humans":[0],"tend":[1],"to":[2,44,64,66,72,96,158,174,177,181],"mine":[3],"objects":[4],"by":[5,234],"learning":[6,172],"from":[7,100],"a":[8,21,84,93,101,131,140],"group":[9,85],"of":[10,15,76,86],"images":[11],"or":[12],"several":[13],"frames":[14],"video":[16,39],"since":[17],"we":[18,91,128,168],"live":[19],"in":[20,229,245],"dynamic":[22],"world.":[23],"In":[24,88],"the":[25,46,77,136,150,156,160,164,179,236],"computer":[26],"vision":[27],"area,":[28],"many":[29],"researchers":[30],"focus":[31],"on":[32,187,225],"co-segmentation":[33],"(CoS),":[34],"co-saliency":[35],"detection":[36,42],"(CoSD)":[37],"and":[38,60,81,143,194,201,203,216,232],"salient":[40],"object":[41],"(VSOD)":[43],"discover":[45],"co-occurrent":[47],"objects.":[48,166],"However,":[49],"previous":[50],"approaches":[51],"design":[52],"different":[53,227],"networks":[54],"for":[55,118],"these":[56,98],"similar":[57],"tasks":[58,228],"separately,":[59],"they":[61,70],"are":[62],"difficult":[63],"apply":[65],"each":[67],"other.":[68],"Besides,":[69],"fail":[71],"take":[73],"full":[74],"advantage":[75],"cues":[78],"among":[79,163],"inter-":[80],"intra-feature":[82],"within":[83],"images.":[87],"this":[89],"paper,":[90],"introduce":[92,130],"unified":[94,102],"framework":[95],"tackle":[97],"issues":[99],"view,":[103],"term":[104],"as":[105,139],"<bold":[106,110,114,119,123],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[107,111,115,120,124,209],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">UFGS</b>":[108],"(":[109],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">U</b>":[112],"nified":[113],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">F</b>":[116],"ramework":[117],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">G</b>":[121],"roup-based":[122],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">S</b>":[125],"egmentation).":[126],"Specifically,":[127],"first":[129],"transformer":[132],"block,":[133],"which":[134,240],"views":[135],"image":[137],"feature":[138],"patch":[141],"token":[142],"then":[144],"captures":[145],"their":[146],"long-range":[147],"dependencies":[148],"through":[149],"self-attention":[151],"mechanism.":[152],"This":[153],"can":[154,241],"help":[155],"network":[157,180,238],"excavate":[159],"patch-structured":[161],"similarities":[162],"relevant":[165],"Furthermore,":[167],"propose":[169],"an":[170],"intra-MLP":[171],"module":[173],"produce":[175],"self-mask":[176],"enhance":[178],"avoid":[182],"partial":[183],"activation.":[184],"Extensive":[185],"experiments":[186],"four":[188],"CoS":[189],"benchmarks":[190,198,206],"(PASCAL,":[191],"iCoseg":[192],"Internet":[193],"MSRC),":[195],"three":[196,226],"CoSD":[197],"(Cosal2015,":[199],"CoSOD3k,":[200],"CocA)":[202],"five":[204],"VSOD":[205],"(DAVIS":[207],"<inline-formula":[208],"xmlns:xlink=\"http://www.w3.org/1999/xlink\"><tex-math":[210],"notation=\"LaTeX\">$_{16}$</tex-math></inline-formula>":[211],",":[212],"FBMS,":[213],"ViSal,":[214],"SegV2,":[215],"DAVSOD)":[217],"show":[218],"that":[219],"our":[220],"method":[221],"outperforms":[222],"other":[223],"state-of-the-arts":[224],"both":[230],"accuracy":[231],"speed":[233],"using":[235],"same":[237],"architecture,":[239],"reach":[242],"140":[243],"FPS":[244],"real-time.":[246]},"counts_by_year":[{"year":2026,"cited_by_count":6},{"year":2025,"cited_by_count":50},{"year":2024,"cited_by_count":43},{"year":2023,"cited_by_count":23},{"year":2022,"cited_by_count":4}],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2025-10-10T00:00:00"}
