{"id":"https://openalex.org/W7162635487","doi":"https://doi.org/10.48550/arxiv.2605.27938","title":"SEMAGIC: Learning Semantically Consistent Deformable 3D Representations from In-the-Wild Images","display_name":"SEMAGIC: Learning Semantically Consistent Deformable 3D Representations from In-the-Wild Images","publication_year":2026,"publication_date":"2026-05-27","ids":{"openalex":"https://openalex.org/W7162635487","doi":"https://doi.org/10.48550/arxiv.2605.27938"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.27938","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27938","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.27938","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137281547","display_name":"Sky Cen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cen, Sky","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070188278","display_name":"Wufei Ma","orcid":"https://orcid.org/0000-0002-4696-2833"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Wufei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137212645","display_name":"Guofeng Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Guofeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137294385","display_name":"Alan Yuille","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yuille, Alan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5084928022","display_name":"Adam Kortylewski","orcid":"https://orcid.org/0000-0002-9146-4403"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kortylewski, Adam","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.921500027179718,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.921500027179718,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.017799999564886093,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.013100000098347664,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.6184999942779541},{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.5586000084877014},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5063999891281128},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.45829999446868896},{"id":"https://openalex.org/keywords/meaning","display_name":"Meaning (existential)","score":0.3887999951839447},{"id":"https://openalex.org/keywords/semantic-property","display_name":"Semantic property","score":0.3833000063896179},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.3828999996185303},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.37229999899864197}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6628999710083008},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6345000267028809},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.6184999942779541},{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.5586000084877014},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5063999891281128},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4675999879837036},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.45829999446868896},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.41909998655319214},{"id":"https://openalex.org/C2780876879","wikidata":"https://www.wikidata.org/wiki/Q3054749","display_name":"Meaning (existential)","level":2,"score":0.3887999951839447},{"id":"https://openalex.org/C198942812","wikidata":"https://www.wikidata.org/wiki/Q496618","display_name":"Semantic property","level":2,"score":0.3833000063896179},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.3828999996185303},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.37229999899864197},{"id":"https://openalex.org/C204366326","wikidata":"https://www.wikidata.org/wiki/Q3027650","display_name":"Deformation (meteorology)","level":2,"score":0.3481000065803528},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.3212999999523163},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.30709999799728394},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2962000072002411},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.2897999882698059},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.28519999980926514},{"id":"https://openalex.org/C2775955345","wikidata":"https://www.wikidata.org/wiki/Q7449071","display_name":"Semantic mapping","level":2,"score":0.2687000036239624},{"id":"https://openalex.org/C131584629","wikidata":"https://www.wikidata.org/wiki/Q4308705","display_name":"Coupling (piping)","level":2,"score":0.26080000400543213}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.27938","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27938","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.27938","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27938","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Learning":[0],"deformable":[1,36,65,82,183,191],"3D":[2,12,66,196],"object":[3],"models":[4,23,184,192],"from":[5,68,114],"single-view":[6,69],"in-the-wild":[7,70],"images":[8],"has":[9],"enabled":[10],"impressive":[11],"shape":[13],"reconstruction":[14,37,75],"without":[15],"supervision.":[16],"However,":[17],"it":[18],"remains":[19],"unclear":[20],"whether":[21],"these":[22],"capture":[24],"the":[25,77],"semantic":[26,53,122,139,152,162,180,195],"structure":[27],"required":[28],"for":[29,61],"downstream":[30],"tasks.":[31],"We":[32,56],"find":[33],"that":[34,110,150,167,177],"existing":[35],"approaches,":[38],"despite":[39],"producing":[40],"visually":[41],"plausible":[42],"geometry,":[43],"yield":[44],"unstable":[45],"correspondences":[46,171],"across":[47,124,154,172],"instances":[48],"and":[49,100,143,146],"perform":[50],"poorly":[51],"on":[52,188],"correspondence":[54,153,181],"benchmarks.":[55],"introduce":[57],"SEMAGIC,":[58],"a":[59,85,96,101,134],"framework":[60],"learning":[62],"semantically":[63],"consistent":[64,121],"representations":[67,166],"images.":[71],"Rather":[72],"than":[73],"treating":[74],"as":[76,84,193],"end":[78],"goal,":[79],"SEMAGIC":[80,164,178],"uses":[81],"modeling":[83],"mechanism":[86],"to":[87,107,119],"discover":[88],"category-level":[89],"correspondences.":[90],"Each":[91],"category":[92],"is":[93,128],"represented":[94],"by":[95,185],"canonical":[97,142],"template":[98],"mesh":[99],"learned":[102],"deformation":[103,149,160],"field,":[104],"functioning":[105],"similarly":[106],"an":[108],"autoencoder":[109],"reconstructs":[111],"instance":[112],"geometry":[113],"image":[115],"features,":[116],"enabling":[117],"vertices":[118],"maintain":[120,168],"meaning":[123],"instances.":[125,155],"Semantic":[126],"consistency":[127,136],"enforced":[129],"during":[130],"training":[131],"through":[132],"(i)":[133],"feature-level":[135],"loss":[137],"aligning":[138],"features":[140],"between":[141],"deformed":[144],"meshes,":[145],"(ii)":[147],"vertex-index-conditioned":[148],"preserves":[151],"By":[156],"explicitly":[157],"coupling":[158],"geometric":[159],"with":[161],"alignment,":[163],"produces":[165],"stable":[169],"part":[170],"intra-category":[173],"variation.":[174],"Experiments":[175],"demonstrate":[176],"improves":[179],"of":[182],"+14.7":[186],"PCK@0.1":[187],"SPair-71k,":[189],"establishing":[190],"effective":[194],"representations.":[197]},"counts_by_year":[],"updated_date":"2026-07-01T08:55:40.977307","created_date":"2026-05-29T00:00:00"}
