{"id":"https://openalex.org/W4390905042","doi":"https://doi.org/10.1109/tits.2023.3348795","title":"A Cross-Scale Hierarchical Transformer With Correspondence-Augmented Attention for Inferring Bird\u2019s-Eye-View Semantic Segmentation","display_name":"A Cross-Scale Hierarchical Transformer With Correspondence-Augmented Attention for Inferring Bird\u2019s-Eye-View Semantic Segmentation","publication_year":2024,"publication_date":"2024-01-16","ids":{"openalex":"https://openalex.org/W4390905042","doi":"https://doi.org/10.1109/tits.2023.3348795"},"language":"en","primary_location":{"id":"doi:10.1109/tits.2023.3348795","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tits.2023.3348795","pdf_url":null,"source":{"id":"https://openalex.org/S144771191","display_name":"IEEE Transactions on Intelligent Transportation Systems","issn_l":"1524-9050","issn":["1524-9050","1558-0016"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Transportation Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5083747119","display_name":"Naiyu Fang","orcid":"https://orcid.org/0000-0003-0145-1690"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Naiyu Fang","raw_affiliation_strings":["State Key Laboratory of Fluid Power and Mechatronic Systems, Zhejiang University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0003-0145-1690","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Fluid Power and Mechatronic Systems, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062424762","display_name":"Lemiao Qiu","orcid":"https://orcid.org/0000-0001-9358-0099"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lemiao Qiu","raw_affiliation_strings":["State Key Laboratory of Fluid Power and Mechatronic Systems, Zhejiang University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0001-9358-0099","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Fluid Power and Mechatronic Systems, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041037485","display_name":"Shuyou Zhang","orcid":"https://orcid.org/0000-0001-9023-5361"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuyou Zhang","raw_affiliation_strings":["State Key Laboratory of Fluid Power and Mechatronic Systems, Zhejiang University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0001-9023-5361","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Fluid Power and Mechatronic Systems, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100693880","display_name":"Zili Wang","orcid":"https://orcid.org/0000-0002-5003-3092"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zili Wang","raw_affiliation_strings":["State Key Laboratory of Fluid Power and Mechatronic Systems, Zhejiang University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-5003-3092","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Fluid Power and Mechatronic Systems, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047651979","display_name":"Kerui Hu","orcid":"https://orcid.org/0000-0002-8055-6468"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kerui Hu","raw_affiliation_strings":["State Key Laboratory of Fluid Power and Mechatronic Systems, Zhejiang University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-8055-6468","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Fluid Power and Mechatronic Systems, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022681712","display_name":"Kang Wang","orcid":"https://orcid.org/0000-0002-3664-0638"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Kang Wang","raw_affiliation_strings":["Hong Kong Polytechnic University, Hung Hom, Hong Kong","Hong Kong Polytechnic University, Hong Kong, Hong Kong"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Hong Kong Polytechnic University, Hung Hom, Hong Kong","institution_ids":["https://openalex.org/I14243506"]},{"raw_affiliation_string":"Hong Kong Polytechnic University, Hong Kong, Hong Kong","institution_ids":["https://openalex.org/I14243506"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5083747119"],"corresponding_institution_ids":["https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":1.9046,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.86081543,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":"25","issue":"7","first_page":"7726","last_page":"7737"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7075231075286865},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6660361886024475},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6574166417121887},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5273360013961792},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4162772297859192},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.39762750267982483},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3836843967437744},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.36504432559013367}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7075231075286865},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6660361886024475},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6574166417121887},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5273360013961792},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4162772297859192},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.39762750267982483},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3836843967437744},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36504432559013367},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tits.2023.3348795","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tits.2023.3348795","pdf_url":null,"source":{"id":"https://openalex.org/S144771191","display_name":"IEEE Transactions on Intelligent Transportation Systems","issn_l":"1524-9050","issn":["1524-9050","1558-0016"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Transportation Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G8176451433","display_name":null,"funder_award_id":"52375271","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8232650804","display_name":null,"funder_award_id":"LY23E050011","funder_id":"https://openalex.org/F4320338464","funder_display_name":"Natural Science Foundation of Zhejiang Province"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320338464","display_name":"Natural Science Foundation of Zhejiang Province","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":58,"referenced_works":["https://openalex.org/W1901129140","https://openalex.org/W2194775991","https://openalex.org/W2284520540","https://openalex.org/W2732011728","https://openalex.org/W2752782242","https://openalex.org/W2798483995","https://openalex.org/W2885937160","https://openalex.org/W2890003176","https://openalex.org/W2908510526","https://openalex.org/W2948515602","https://openalex.org/W2955189650","https://openalex.org/W2963351448","https://openalex.org/W2963587345","https://openalex.org/W2964294967","https://openalex.org/W2971173446","https://openalex.org/W2971726345","https://openalex.org/W2998083489","https://openalex.org/W3010707748","https://openalex.org/W3034669477","https://openalex.org/W3035574168","https://openalex.org/W3043357436","https://openalex.org/W3100744475","https://openalex.org/W3102343027","https://openalex.org/W3109395584","https://openalex.org/W3109428934","https://openalex.org/W3138516171","https://openalex.org/W3174288891","https://openalex.org/W3175199633","https://openalex.org/W3209892767","https://openalex.org/W4205560903","https://openalex.org/W4214530037","https://openalex.org/W4280563105","https://openalex.org/W4281848959","https://openalex.org/W4286768331","https://openalex.org/W4289283268","https://openalex.org/W4297094385","https://openalex.org/W4312427473","https://openalex.org/W4312492443","https://openalex.org/W4312556291","https://openalex.org/W4312641958","https://openalex.org/W4312850715","https://openalex.org/W4312878643","https://openalex.org/W4312881242","https://openalex.org/W4312894406","https://openalex.org/W4313855650","https://openalex.org/W4319878682","https://openalex.org/W4323345754","https://openalex.org/W4327662038","https://openalex.org/W4379116594","https://openalex.org/W4386066137","https://openalex.org/W4386882931","https://openalex.org/W6756392615","https://openalex.org/W6757817989","https://openalex.org/W6762718338","https://openalex.org/W6784094891","https://openalex.org/W6790690058","https://openalex.org/W6839067270","https://openalex.org/W6839180059"],"related_works":["https://openalex.org/W2055243143","https://openalex.org/W4379231730","https://openalex.org/W4321636575","https://openalex.org/W2357796999","https://openalex.org/W2045526782","https://openalex.org/W2741131631","https://openalex.org/W4206178588","https://openalex.org/W4287635093","https://openalex.org/W3094491777","https://openalex.org/W3214715529"],"abstract_inverted_index":{"As":[0],"bird\u2019s-eye-view":[1],"(BEV)":[2],"semantic":[3,26,128,242],"segmentation":[4,27,129,243],"is":[5,32,147,202],"simple-to-visualize":[6],"and":[7,42,55,177,198,221,228],"easy-to-handle,":[8],"it":[9],"has":[10,236],"been":[11],"applied":[12],"in":[13,36,71,173,204,239],"autonomous":[14],"driving":[15],"to":[16,21,79,106,137,169,185,195],"provide":[17],"the":[18,37,53,67,72,76,81,108,139,144,151,156,166,179,214,219,222],"surrounding":[19],"information":[20,89,187],"downstream":[22],"tasks.":[23],"Inferring":[24],"BEV":[25,94,140,183,241],"conditioned":[28,244],"on":[29,245],"multi-camera-view":[30,246],"images":[31],"a":[33,119,134,174,205],"popular":[34],"scheme":[35],"community":[38],"as":[39],"cheap":[40],"devices":[41],"real-time":[43],"processing.":[44],"The":[45],"recent":[46],"work":[47],"implemented":[48,203],"this":[49,161],"task":[50],"by":[51,160],"learning":[52,69],"content":[54],"position":[56],"relationship":[57,68],"via":[58],"Vision":[59],"Transformer":[60,123,168],"(ViT).":[61],"However,":[62],"its":[63],"quadratic":[64],"complexity":[65],"confines":[66],"only":[70,148],"latent":[73],"layer,":[74],"leaving":[75],"scale":[77],"gap":[78],"impede":[80],"representation":[82],"of":[83,88,99,110,150,182],"fine-grained":[84],"objects.":[85],"In":[86],"view":[87,101],"absorption,":[90],"when":[91],"representing":[92],"position-related":[93],"features,":[95],"their":[96],"weighted":[97],"fusion":[98,109],"all":[100],"feature":[102,141,171],"imposes":[103],"inconducive":[104,199],"features":[105,184],"disturb":[107],"conducive":[111,197],"features.":[112],"To":[113,154],"tackle":[114],"these":[115],"issues,":[116],"we":[117,132,164],"propose":[118,192],"novel":[120],"cross-scale":[121,167],"hierarchical":[122,135,162],"with":[124],"correspondence-augmented":[125,193],"attention":[126,194,211,224],"for":[127],"inference.":[130],"Specifically,":[131],"devise":[133],"framework":[136],"refine":[138],"representation,":[142],"where":[143],"last":[145],"size":[146],"half":[149],"final":[152],"segmentation.":[153],"save":[155],"computation":[157],"increase":[158],"caused":[159],"framework,":[163],"exploit":[165],"learn":[170],"relationships":[172],"reversed-aligning":[175],"way,":[176,209],"leverage":[178],"residual":[180],"connection":[181],"facilitate":[186],"transmission":[188],"between":[189],"scales.":[190],"We":[191],"distinguish":[196],"correspondences.":[200],"It":[201],"simple":[206],"yet":[207],"effective":[208],"amplifying":[210],"scores":[212,225],"before":[213],"Softmax":[215],"operation,":[216],"so":[217],"that":[218,233],"position-view-related":[220],"position-view-disrelated":[223],"are":[226],"highlighted":[227],"suppressed.":[229],"Extensive":[230],"experiments":[231],"demonstrate":[232],"our":[234],"method":[235],"state-of-the-art":[237],"performance":[238],"inferring":[240],"images.":[247]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":6}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
