{"id":"https://openalex.org/W3214707056","doi":"https://doi.org/10.1109/iccvw54120.2021.00301","title":"A Unified Efficient Pyramid Transformer for Semantic Segmentation","display_name":"A Unified Efficient Pyramid Transformer for Semantic Segmentation","publication_year":2021,"publication_date":"2021-10-01","ids":{"openalex":"https://openalex.org/W3214707056","doi":"https://doi.org/10.1109/iccvw54120.2021.00301","mag":"3214707056"},"language":"en","primary_location":{"id":"doi:10.1109/iccvw54120.2021.00301","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccvw54120.2021.00301","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE/CVF International Conference on Computer Vision Workshops (ICCVW)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5082377384","display_name":"Fangrui Zhu","orcid":null},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Fangrui Zhu","raw_affiliation_strings":["School of Data Science, Fudan University"],"affiliations":[{"raw_affiliation_string":"School of Data Science, Fudan University","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019191351","display_name":"Yi Zhu","orcid":"https://orcid.org/0000-0002-6482-6712"},"institutions":[{"id":"https://openalex.org/I1311688040","display_name":"Amazon (United States)","ror":"https://ror.org/04mv4n011","country_code":"US","type":"company","lineage":["https://openalex.org/I1311688040"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yi Zhu","raw_affiliation_strings":["Amazon Web Services"],"affiliations":[{"raw_affiliation_string":"Amazon Web Services","institution_ids":["https://openalex.org/I1311688040"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100425703","display_name":"Li Zhang","orcid":"https://orcid.org/0000-0003-1031-5420"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Li Zhang","raw_affiliation_strings":["School of Data Science, Fudan University"],"affiliations":[{"raw_affiliation_string":"School of Data Science, Fudan University","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089678310","display_name":"Chongruo Wu","orcid":"https://orcid.org/0000-0002-4569-5024"},"institutions":[{"id":"https://openalex.org/I84218800","display_name":"University of California, Davis","ror":"https://ror.org/05rrcem69","country_code":"US","type":"education","lineage":["https://openalex.org/I84218800"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Chongruo Wu","raw_affiliation_strings":["University of California, Davis"],"affiliations":[{"raw_affiliation_string":"University of California, Davis","institution_ids":["https://openalex.org/I84218800"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084959430","display_name":"Yanwei Fu","orcid":"https://orcid.org/0000-0002-6595-6893"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanwei Fu","raw_affiliation_strings":["School of Data Science, Fudan University"],"affiliations":[{"raw_affiliation_string":"School of Data Science, Fudan University","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100399461","display_name":"Mu Li","orcid":"https://orcid.org/0000-0002-4433-2301"},"institutions":[{"id":"https://openalex.org/I1311688040","display_name":"Amazon (United States)","ror":"https://ror.org/04mv4n011","country_code":"US","type":"company","lineage":["https://openalex.org/I1311688040"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mu Li","raw_affiliation_strings":["Amazon Web Services"],"affiliations":[{"raw_affiliation_string":"Amazon Web Services","institution_ids":["https://openalex.org/I1311688040"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5082377384"],"corresponding_institution_ids":["https://openalex.org/I24943067"],"apc_list":null,"apc_paid":null,"fwci":2.8821,"has_fulltext":false,"cited_by_count":36,"citation_normalized_percentile":{"value":0.92566993,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"2667","last_page":"2677"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8328624963760376},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7281787991523743},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5668771266937256},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5571698546409607},{"id":"https://openalex.org/keywords/pyramid","display_name":"Pyramid (geometry)","score":0.5562625527381897},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.4882838726043701},{"id":"https://openalex.org/keywords/context-model","display_name":"Context model","score":0.4753967225551605},{"id":"https://openalex.org/keywords/spatial-contextual-awareness","display_name":"Spatial contextual awareness","score":0.4349328279495239},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.39842426776885986},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.342949241399765},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3308752179145813},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3233252167701721},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.10464444756507874}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8328624963760376},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7281787991523743},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5668771266937256},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5571698546409607},{"id":"https://openalex.org/C142575187","wikidata":"https://www.wikidata.org/wiki/Q3358290","display_name":"Pyramid (geometry)","level":2,"score":0.5562625527381897},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.4882838726043701},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.4753967225551605},{"id":"https://openalex.org/C64754055","wikidata":"https://www.wikidata.org/wiki/Q7574053","display_name":"Spatial contextual awareness","level":2,"score":0.4349328279495239},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.39842426776885986},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.342949241399765},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3308752179145813},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3233252167701721},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.10464444756507874},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iccvw54120.2021.00301","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccvw54120.2021.00301","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE/CVF International Conference on Computer Vision Workshops (ICCVW)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":107,"referenced_works":["https://openalex.org/W603908379","https://openalex.org/W1495267108","https://openalex.org/W1817277359","https://openalex.org/W1903029394","https://openalex.org/W1923697677","https://openalex.org/W2035990954","https://openalex.org/W2125215748","https://openalex.org/W2194775991","https://openalex.org/W2266390837","https://openalex.org/W2340897893","https://openalex.org/W2412782625","https://openalex.org/W2560023338","https://openalex.org/W2563705555","https://openalex.org/W2584471766","https://openalex.org/W2630837129","https://openalex.org/W2737258237","https://openalex.org/W2752782242","https://openalex.org/W2780664485","https://openalex.org/W2799166040","https://openalex.org/W2799213142","https://openalex.org/W2884822772","https://openalex.org/W2885139206","https://openalex.org/W2890782586","https://openalex.org/W2895340641","https://openalex.org/W2896457183","https://openalex.org/W2950045474","https://openalex.org/W2955058313","https://openalex.org/W2955813853","https://openalex.org/W2962872526","https://openalex.org/W2963307106","https://openalex.org/W2963318290","https://openalex.org/W2963727650","https://openalex.org/W2963840672","https://openalex.org/W2963971305","https://openalex.org/W2964252655","https://openalex.org/W2964254867","https://openalex.org/W2964309882","https://openalex.org/W2981689412","https://openalex.org/W2981793666","https://openalex.org/W2981899103","https://openalex.org/W2982220924","https://openalex.org/W2982631194","https://openalex.org/W2987761193","https://openalex.org/W2989684653","https://openalex.org/W2991471181","https://openalex.org/W2993235622","https://openalex.org/W3015468748","https://openalex.org/W3022261194","https://openalex.org/W3034345703","https://openalex.org/W3034634365","https://openalex.org/W3035339581","https://openalex.org/W3035358681","https://openalex.org/W3094502228","https://openalex.org/W3096653763","https://openalex.org/W3097065222","https://openalex.org/W3107113572","https://openalex.org/W3107497254","https://openalex.org/W3107634219","https://openalex.org/W3108186749","https://openalex.org/W3109196706","https://openalex.org/W3109301572","https://openalex.org/W3122239467","https://openalex.org/W3131500599","https://openalex.org/W3138516171","https://openalex.org/W3167260844","https://openalex.org/W3170841864","https://openalex.org/W3170874841","https://openalex.org/W3211490618","https://openalex.org/W3213165621","https://openalex.org/W4241071816","https://openalex.org/W4292779060","https://openalex.org/W4295838474","https://openalex.org/W4297665946","https://openalex.org/W4323654151","https://openalex.org/W4385245566","https://openalex.org/W6618372016","https://openalex.org/W6638480814","https://openalex.org/W6640295612","https://openalex.org/W6696085341","https://openalex.org/W6715287400","https://openalex.org/W6730845260","https://openalex.org/W6739696289","https://openalex.org/W6739901393","https://openalex.org/W6748481559","https://openalex.org/W6749010802","https://openalex.org/W6753421600","https://openalex.org/W6754123467","https://openalex.org/W6754713557","https://openalex.org/W6754879843","https://openalex.org/W6755207826","https://openalex.org/W6761628794","https://openalex.org/W6768371451","https://openalex.org/W6771194246","https://openalex.org/W6771626834","https://openalex.org/W6775170262","https://openalex.org/W6775845032","https://openalex.org/W6776048684","https://openalex.org/W6776782944","https://openalex.org/W6778883912","https://openalex.org/W6779387320","https://openalex.org/W6779806301","https://openalex.org/W6784094891","https://openalex.org/W6784333009","https://openalex.org/W6788135285","https://openalex.org/W6788620109","https://openalex.org/W6797399245","https://openalex.org/W6798837711"],"related_works":["https://openalex.org/W2140435402","https://openalex.org/W4285276086","https://openalex.org/W2161633202","https://openalex.org/W2039787362","https://openalex.org/W1750537857","https://openalex.org/W2163490908","https://openalex.org/W2901621883","https://openalex.org/W3022564861","https://openalex.org/W2657488695","https://openalex.org/W2394987862"],"abstract_inverted_index":{"Semantic":[0],"segmentation":[1,109],"is":[2,31,80],"a":[3,42,60,76],"challenging":[4],"problem":[5],"due":[6],"to":[7,46,64,82],"difficulties":[8],"in":[9,12,34,95],"modeling":[10,26],"context":[11,25,52,72],"complex":[13],"scenes":[14],"and":[15,54],"class":[16],"confusions":[17],"along":[18],"boundaries.":[19],"Most":[20],"literature":[21],"either":[22],"focuses":[23],"on":[24,103],"or":[27],"boundary":[28,55,87],"refinement,":[29],"which":[30],"less":[32],"generalizable":[33],"open-world":[35],"scenarios.":[36],"In":[37,74],"this":[38],"work,":[39],"we":[40],"advocate":[41],"unified":[43],"framework":[44],"(UN-EPT)":[45],"segment":[47],"objects":[48],"by":[49],"considering":[50],"both":[51],"information":[53],"artifacts.":[56],"We":[57,99],"first":[58],"adapt":[59],"sparse":[61],"sampling":[62],"strategy":[63],"incorporate":[65],"the":[66],"transformer-based":[67],"attention":[68],"mechanism":[69],"for":[70,86,107],"efficient":[71],"modeling.":[73],"addition,":[75],"separate":[77],"spatial":[78],"branch":[79],"introduced":[81],"capture":[83],"image":[84],"details":[85],"refinement.":[88],"The":[89],"whole":[90],"model":[91],"can":[92],"be":[93],"trained":[94],"an":[96],"end-to-end":[97],"manner.":[98],"demonstrate":[100],"promising":[101],"performance":[102],"three":[104],"popular":[105],"benchmarks":[106],"semantic":[108],"with":[110],"low":[111],"memory":[112],"footprint.":[113]},"counts_by_year":[{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":13}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
