{"id":"https://openalex.org/W7162533675","doi":"https://doi.org/10.1109/3dv69130.2026.00152","title":"HiT: Hierarchical Transformers for Unsupervised 3D Shape Abstraction","display_name":"HiT: Hierarchical Transformers for Unsupervised 3D Shape Abstraction","publication_year":2026,"publication_date":"2026-03-20","ids":{"openalex":"https://openalex.org/W7162533675","doi":"https://doi.org/10.1109/3dv69130.2026.00152"},"language":null,"primary_location":{"id":"doi:10.1109/3dv69130.2026.00152","is_oa":false,"landing_page_url":"https://doi.org/10.1109/3dv69130.2026.00152","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 International Conference on 3D Vision (3DV)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088462108","display_name":"Aditya Vora","orcid":"https://orcid.org/0000-0002-6177-1912"},"institutions":[{"id":"https://openalex.org/I18014758","display_name":"Simon Fraser University","ror":"https://ror.org/0213rcc28","country_code":"CA","type":"education","lineage":["https://openalex.org/I18014758"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Aditya Vora","raw_affiliation_strings":["Simon Fraser University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Simon Fraser University","institution_ids":["https://openalex.org/I18014758"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025321001","display_name":"Lily Goli","orcid":null},"institutions":[{"id":"https://openalex.org/I185261750","display_name":"University of Toronto","ror":"https://ror.org/03dbr7087","country_code":"CA","type":"education","lineage":["https://openalex.org/I185261750"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Lily Goli","raw_affiliation_strings":["University of Toronto"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Toronto","institution_ids":["https://openalex.org/I185261750"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037094498","display_name":"Andrea Tagliasacchi","orcid":"https://orcid.org/0000-0002-2209-7187"},"institutions":[{"id":"https://openalex.org/I18014758","display_name":"Simon Fraser University","ror":"https://ror.org/0213rcc28","country_code":"CA","type":"education","lineage":["https://openalex.org/I18014758"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Andrea Tagliasacchi","raw_affiliation_strings":["Simon Fraser University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Simon Fraser University","institution_ids":["https://openalex.org/I18014758"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100397026","display_name":"Hao Zhang","orcid":"https://orcid.org/0000-0003-1991-119X"},"institutions":[{"id":"https://openalex.org/I18014758","display_name":"Simon Fraser University","ror":"https://ror.org/0213rcc28","country_code":"CA","type":"education","lineage":["https://openalex.org/I18014758"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Hao Zhang","raw_affiliation_strings":["Simon Fraser University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Simon Fraser University","institution_ids":["https://openalex.org/I18014758"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.83850177,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1598","last_page":"1607"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.8561999797821045,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.8561999797821045,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.02319999970495701,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.014700000174343586,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/abstraction","display_name":"Abstraction","score":0.4489000141620636},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4471000134944916},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3346000015735626},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.23810000717639923}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6297000050544739},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5198000073432922},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.4489000141620636},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4471000134944916},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3424000144004822},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3346000015735626},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3188999891281128},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2538999915122986},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.23810000717639923},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.23309999704360962}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/3dv69130.2026.00152","is_oa":false,"landing_page_url":"https://doi.org/10.1109/3dv69130.2026.00152","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 International Conference on 3D Vision (3DV)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W1501418839","https://openalex.org/W1825507529","https://openalex.org/W1975807399","https://openalex.org/W1976645892","https://openalex.org/W2553307952","https://openalex.org/W2612843093","https://openalex.org/W2918473435","https://openalex.org/W2947464908","https://openalex.org/W2961368225","https://openalex.org/W2981657250","https://openalex.org/W2989341556","https://openalex.org/W2989673842","https://openalex.org/W3034700465","https://openalex.org/W3035046407","https://openalex.org/W3035163517","https://openalex.org/W3035333439","https://openalex.org/W3117476483","https://openalex.org/W3132401450","https://openalex.org/W3138516171","https://openalex.org/W3180251767","https://openalex.org/W3202589837","https://openalex.org/W3209873929","https://openalex.org/W3210613940","https://openalex.org/W4205189682","https://openalex.org/W4286616176","https://openalex.org/W4312433568","https://openalex.org/W4312566115","https://openalex.org/W4313118252","https://openalex.org/W4321512591","https://openalex.org/W4365441113","https://openalex.org/W4385275714","https://openalex.org/W4386066076","https://openalex.org/W4386071473","https://openalex.org/W4386071532","https://openalex.org/W4386071629","https://openalex.org/W4386075622","https://openalex.org/W4386075898","https://openalex.org/W4400582074","https://openalex.org/W4410027736"],"related_works":[],"abstract_inverted_index":{"We":[0,142],"introduce":[1],"HiT,":[2],"a":[3,17,32,47,73,128],"novel":[4],"hierarchical":[5,33,75,104],"neural":[6],"field":[7],"representation":[8],"for":[9,85],"3D":[10],"shapes":[11,162],"that":[12,68],"learns":[13,39],"general":[14,116],"hierarchies":[15,119],"in":[16,24],"coarse-to-fine":[18],"manner":[19],"across":[20,60],"different":[21],"shape":[22,63,111,149],"categories":[23],"an":[25,147],"unsupervised":[26,148],"setting.":[27],"Our":[28],"key":[29],"contribution":[30],"is":[31],"transformer":[34],"(HIT),":[35],"where":[36,157],"each":[37,93],"level":[38],"parent\u2013child":[40],"relationships":[41,136],"of":[42,90,166],"the":[43,53,70,87,103],"tree":[44,94],"hierarchy":[45],"using":[46],"compressed":[48],"codebook.":[49],"This":[50,96],"codebook":[51],"enables":[52],"network":[54],"to":[55,72,101],"automatically":[56],"identify":[57],"common":[58],"substructures":[59],"potentially":[61],"diverse":[62],"categories.":[64],"Unlike":[65],"previous":[66],"works":[67],"constrain":[69],"task":[71,151],"fixed":[74],"structure":[76,105],"(e.g.,":[77],"binary),":[78],"we":[79],"impose":[80],"no":[81],"such":[82],"restriction,":[83],"except":[84],"limiting":[86],"total":[88],"number":[89],"nodes":[91],"at":[92,125],"level.":[95],"flexibility":[97],"allows":[98],"our":[99,131,158],"method":[100,159],"infer":[102],"directly":[106],"from":[107],"data,":[108],"over":[109,152],"multiple":[110,164],"categories,":[112,156],"and":[113,117,139],"representing":[114],"more":[115],"complex":[118],"than":[120],"prior":[121],"approaches.":[122],"When":[123],"trained":[124],"scale":[126],"with":[127],"reconstruction":[129],"loss,":[130],"model":[132],"captures":[133],"meaningful":[134],"containment":[135],"between":[137],"parent":[138],"child":[140],"nodes.":[141],"demonstrate":[143],"its":[144],"effectiveness":[145],"through":[146],"segmentation":[150],"all":[153],"55":[154],"ShapeNet":[155],"successfully":[160],"segments":[161],"into":[163],"levels":[165],"granularity.":[167],"Project":[168],"Page:":[169],"aditya-vora.github.io/HiT/":[170]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-28T00:00:00"}
