{"id":"https://openalex.org/W4312340851","doi":"https://doi.org/10.1109/icdl53763.2022.9962232","title":"Disentangling Patterns and Transformations from One Sequence of Images with Shape-invariant Lie Group Transformer","display_name":"Disentangling Patterns and Transformations from One Sequence of Images with Shape-invariant Lie Group Transformer","publication_year":2022,"publication_date":"2022-09-12","ids":{"openalex":"https://openalex.org/W4312340851","doi":"https://doi.org/10.1109/icdl53763.2022.9962232"},"language":"en","primary_location":{"id":"doi:10.1109/icdl53763.2022.9962232","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icdl53763.2022.9962232","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Development and Learning (ICDL)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056078233","display_name":"Takumi Takada","orcid":null},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Takumi Takada","raw_affiliation_strings":["The University of Tokyo,School of Information Science and Technology,Tokyo,Japan","School of Information Science and Technology, The University of Tokyo, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"The University of Tokyo,School of Information Science and Technology,Tokyo,Japan","institution_ids":["https://openalex.org/I74801974"]},{"raw_affiliation_string":"School of Information Science and Technology, The University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067318506","display_name":"Wataru Shimaya","orcid":"https://orcid.org/0009-0005-4524-8514"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Wataru Shimaya","raw_affiliation_strings":["The University of Tokyo,School of Information Science and Technology,Tokyo,Japan","School of Information Science and Technology, The University of Tokyo, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"The University of Tokyo,School of Information Science and Technology,Tokyo,Japan","institution_ids":["https://openalex.org/I74801974"]},{"raw_affiliation_string":"School of Information Science and Technology, The University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019675297","display_name":"Yoshiyuki Ohmura","orcid":"https://orcid.org/0000-0002-9158-5360"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yoshiyuki Ohmura","raw_affiliation_strings":["The University of Tokyo,School of Information Science and Technology,Tokyo,Japan","School of Information Science and Technology, The University of Tokyo, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"The University of Tokyo,School of Information Science and Technology,Tokyo,Japan","institution_ids":["https://openalex.org/I74801974"]},{"raw_affiliation_string":"School of Information Science and Technology, The University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010543059","display_name":"Yasuo Kuniyoshi","orcid":"https://orcid.org/0000-0001-8443-4161"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yasuo Kuniyoshi","raw_affiliation_strings":["The University of Tokyo,School of Information Science and Technology,Tokyo,Japan","Next Generation Artificial Intelligence Research Center (AI Center), The University of Tokyo, Tokyo, Japan","School of Information Science and Technology, The University of Tokyo, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"The University of Tokyo,School of Information Science and Technology,Tokyo,Japan","institution_ids":["https://openalex.org/I74801974"]},{"raw_affiliation_string":"Next Generation Artificial Intelligence Research Center (AI Center), The University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]},{"raw_affiliation_string":"School of Information Science and Technology, The University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5056078233"],"corresponding_institution_ids":["https://openalex.org/I74801974"],"apc_list":null,"apc_paid":null,"fwci":0.302,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.55397976,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"54","last_page":"59"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9937000274658203,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/invariant","display_name":"Invariant (physics)","score":0.660939633846283},{"id":"https://openalex.org/keywords/lie-group","display_name":"Lie group","score":0.6100163459777832},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5962315797805786},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5086158514022827},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4389404356479645},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.40535563230514526},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.37264901399612427},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.33831727504730225},{"id":"https://openalex.org/keywords/algebra-over-a-field","display_name":"Algebra over a field","score":0.3324856758117676},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.33098480105400085},{"id":"https://openalex.org/keywords/pure-mathematics","display_name":"Pure mathematics","score":0.27720385789871216}],"concepts":[{"id":"https://openalex.org/C190470478","wikidata":"https://www.wikidata.org/wiki/Q2370229","display_name":"Invariant (physics)","level":2,"score":0.660939633846283},{"id":"https://openalex.org/C187915474","wikidata":"https://www.wikidata.org/wiki/Q622679","display_name":"Lie group","level":2,"score":0.6100163459777832},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5962315797805786},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5086158514022827},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4389404356479645},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.40535563230514526},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.37264901399612427},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.33831727504730225},{"id":"https://openalex.org/C136119220","wikidata":"https://www.wikidata.org/wiki/Q1000660","display_name":"Algebra over a field","level":2,"score":0.3324856758117676},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.33098480105400085},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.27720385789871216},{"id":"https://openalex.org/C37914503","wikidata":"https://www.wikidata.org/wiki/Q156495","display_name":"Mathematical physics","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icdl53763.2022.9962232","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icdl53763.2022.9962232","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Development and Learning (ICDL)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320317988","display_name":"Artificial Intelligence Research Center","ror":null},{"id":"https://openalex.org/F4320322832","display_name":"University of Tokyo","ror":"https://ror.org/057zh3y96"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4310420093","https://openalex.org/W3154635860","https://openalex.org/W4226332880","https://openalex.org/W4298054035","https://openalex.org/W4200631625","https://openalex.org/W4307377619","https://openalex.org/W1620410898","https://openalex.org/W4226138400","https://openalex.org/W3026007073","https://openalex.org/W4378718358"],"abstract_inverted_index":{"An":[0],"effective":[1],"way":[2],"to":[3,10,39,83,120,165],"model":[4,178,229],"the":[5,12,29,32,60,63,105,109,121,126,134,149,167,181,184,203,227,232,242],"complex":[6],"real":[7,33],"world":[8,13,61,107],"is":[9,36,108],"view":[11],"as":[14,133,141,209],"a":[15,44,71,76,89,98,177],"composition":[16],"of":[17,20,31,59,79,111,123,128,187,190,199,218],"basic":[18,188],"components":[19,189],"objects":[21,223,235],"and":[22,100,115,163,192,236],"transformations.":[23],"Although":[24],"humans":[25],"through":[26],"development":[27],"understand":[28],"compositionality":[30],"world,":[34],"it":[35],"extremely":[37],"difficult":[38],"equip":[40],"robots":[41],"with":[42,158,169],"such":[43,84,140],"learning":[45,57,95],"mechanism.":[46],"In":[47],"recent":[48],"years,":[49],"there":[50],"has":[51],"been":[52],"significant":[53],"research":[54],"on":[55,97,172],"autonomously":[56],"representations":[58],"using":[62],"deep":[64],"learning;":[65],"however,":[66],"most":[67],"studies":[68],"have":[69],"taken":[70],"statistical":[72],"approach,":[73],"which":[74,221],"requires":[75],"large":[77],"number":[78,186],"training":[80],"data.":[81],"Contrary":[82],"existing":[85],"methods,":[86],"we":[87,145,175],"take":[88],"novel":[90],"algebraic":[91],"approach":[92],"for":[93],"representation":[94],"based":[96],"simpler":[99],"more":[101],"intuitive":[102],"formulation":[103],"that":[104,117,148,179,214,240],"observed":[106],"combination":[110],"multiple":[112,237],"independent":[113],"patterns":[114,129,150,191],"transformations":[116,139,157,194,239],"are":[118,224],"invariant":[119,135],"shape":[122,127],"patterns.":[124],"Since":[125],"can":[130,146,151,230],"be":[131,153],"viewed":[132],"features":[136],"against":[137],"symmetric":[138,159],"translation":[142],"or":[143],"rotation,":[144],"expect":[147],"naturally":[152],"extracted":[154],"by":[155,201],"expressing":[156],"Lie":[160,193,206],"group":[161,207],"transformers":[162,208],"attempting":[164],"reconstruct":[166],"scene":[168],"them.":[170],"Based":[171],"this":[173],"idea,":[174],"propose":[176],"disentangles":[180],"scenes":[182],"into":[183],"minimum":[185],"from":[195],"only":[196],"one":[197,216],"sequence":[198,217],"images,":[200],"introducing":[202],"learnable":[204],"shape-invariant":[205,238],"transformation":[210],"components.":[211],"Experiments":[212],"show":[213],"given":[215],"images":[219],"in":[220],"two":[222],"moving":[225],"independently,":[226],"proposed":[228],"discover":[231],"hidden":[233],"distinct":[234],"constitute":[241],"scenes.":[243]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
