{"id":"https://openalex.org/W7136174797","doi":"https://doi.org/10.48550/arxiv.2603.12918","title":"VIRD: View-Invariant Representation through Dual-Axis Transformation for Cross-View Pose Estimation","display_name":"VIRD: View-Invariant Representation through Dual-Axis Transformation for Cross-View Pose Estimation","publication_year":2026,"publication_date":"2026-03-13","ids":{"openalex":"https://openalex.org/W7136174797","doi":"https://doi.org/10.48550/arxiv.2603.12918"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.12918","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.12918","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.12918","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129449049","display_name":"Juhye Park","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Park, Juhye","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082844857","display_name":"Wooju Lee","orcid":"https://orcid.org/0000-0002-3388-3765"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Wooju","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044688731","display_name":"Dasol Hong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hong, Dasol","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021044069","display_name":"Changki Sung","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sung, Changki","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129584650","display_name":"Youngwoo Seo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Seo, Youngwoo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129482639","display_name":"Dongwan Kang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kang, Dongwan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129534943","display_name":"Hyun Myung","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Myung, Hyun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9732000231742859,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9732000231742859,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.010900000110268593,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.002899999963119626,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.7515000104904175},{"id":"https://openalex.org/keywords/orientation","display_name":"Orientation (vector space)","score":0.7339000105857849},{"id":"https://openalex.org/keywords/transformation","display_name":"Transformation (genetics)","score":0.6773999929428101},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.6057999730110168},{"id":"https://openalex.org/keywords/position","display_name":"Position (finance)","score":0.49880000948905945},{"id":"https://openalex.org/keywords/3d-pose-estimation","display_name":"3D pose estimation","score":0.48829999566078186},{"id":"https://openalex.org/keywords/satellite","display_name":"Satellite","score":0.4593999981880188},{"id":"https://openalex.org/keywords/bridge","display_name":"Bridge (graph theory)","score":0.44909998774528503}],"concepts":[{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7616000175476074},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7581999897956848},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.7515000104904175},{"id":"https://openalex.org/C16345878","wikidata":"https://www.wikidata.org/wiki/Q107472979","display_name":"Orientation (vector space)","level":2,"score":0.7339000105857849},{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.6773999929428101},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6474999785423279},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.6057999730110168},{"id":"https://openalex.org/C198082294","wikidata":"https://www.wikidata.org/wiki/Q3399648","display_name":"Position (finance)","level":2,"score":0.49880000948905945},{"id":"https://openalex.org/C36613465","wikidata":"https://www.wikidata.org/wiki/Q4636322","display_name":"3D pose estimation","level":3,"score":0.48829999566078186},{"id":"https://openalex.org/C19269812","wikidata":"https://www.wikidata.org/wiki/Q26540","display_name":"Satellite","level":2,"score":0.4593999981880188},{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.44909998774528503},{"id":"https://openalex.org/C161218011","wikidata":"https://www.wikidata.org/wiki/Q11827794","display_name":"Multipath propagation","level":3,"score":0.3452000021934509},{"id":"https://openalex.org/C80551277","wikidata":"https://www.wikidata.org/wiki/Q11210","display_name":"Coordinate system","level":2,"score":0.3276999890804291},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.32420000433921814},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.31139999628067017},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.28839999437332153},{"id":"https://openalex.org/C2780297707","wikidata":"https://www.wikidata.org/wiki/Q4895393","display_name":"Landmark","level":2,"score":0.27810001373291016},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.27790001034736633},{"id":"https://openalex.org/C22100474","wikidata":"https://www.wikidata.org/wiki/Q4800952","display_name":"Articulated body pose estimation","level":4,"score":0.2662000060081482},{"id":"https://openalex.org/C126795593","wikidata":"https://www.wikidata.org/wiki/Q7333813","display_name":"Rigid transformation","level":2,"score":0.2651999890804291},{"id":"https://openalex.org/C2776717989","wikidata":"https://www.wikidata.org/wiki/Q19410276","display_name":"FREAK","level":2,"score":0.26420000195503235},{"id":"https://openalex.org/C74050887","wikidata":"https://www.wikidata.org/wiki/Q848368","display_name":"Rotation (mathematics)","level":2,"score":0.25130000710487366}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.12918","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.12918","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.12918","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.12918","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Accurate":[0],"global":[1],"localization":[2],"is":[3],"critical":[4],"for":[5],"autonomous":[6],"driving":[7],"and":[8,18,58,105,137,144,160,165,169,171],"robotics,":[9],"but":[10],"GNSS-based":[11],"approaches":[12],"often":[13],"degrade":[14],"due":[15,62],"to":[16,34,40,49,63,89,93,109,133],"occlusion":[17],"multipath":[19],"effects.":[20],"As":[21],"an":[22],"emerging":[23],"alternative,":[24],"cross-view":[25,71,138],"pose":[26,32,72],"estimation":[27,73],"predicts":[28],"the":[29,51,56,90,103,115,130,135,142,151],"3-DoF":[30],"camera":[31],"corresponding":[33],"a":[35,41,69,86,125],"ground-view":[36],"image":[37],"with":[38],"respect":[39],"geo-referenced":[42],"satellite":[43,59,91,107],"image.":[44],"However,":[45],"existing":[46],"methods":[47,153],"struggle":[48],"bridge":[50],"significant":[52],"viewpoint":[53,116],"gap":[54],"between":[55],"ground":[57,104],"views":[60],"mainly":[61],"limited":[64],"spatial":[65],"correspondences.":[66],"We":[67],"propose":[68],"novel":[70],"method":[74],"that":[75,128,148],"constructs":[76],"view-invariant":[77],"representations":[78,132],"through":[79],"dual-axis":[80],"transformation":[81,88],"(VIRD).":[82],"VIRD":[83,149],"first":[84],"applies":[85],"polar":[87],"view":[92,121],"facilitate":[94],"horizontal":[95],"correspondence,":[96],"then":[97],"uses":[98],"context-enhanced":[99],"positional":[100],"attention":[101],"on":[102,141,167,173],"polar-transformed":[106],"features":[108],"mitigate":[110],"vertical":[111],"misalignment,":[112],"explicitly":[113],"bridging":[114],"gap.":[117],"To":[118],"further":[119],"strengthen":[120],"invariance,":[122],"we":[123],"introduce":[124],"view-reconstruction":[126],"loss":[127],"encourages":[129],"derived":[131],"reconstruct":[134],"original":[136],"images.":[139],"Experiments":[140],"KITTI":[143],"VIGOR":[145],"datasets":[146],"demonstrate":[147],"outperforms":[150],"state-of-the-art":[152],"without":[154],"orientation":[155,161],"priors,":[156],"reducing":[157],"median":[158],"position":[159],"errors":[162],"by":[163],"50.7%":[164],"76.5%":[166],"KITTI,":[168],"18.0%":[170],"46.8%":[172],"VIGOR,":[174],"respectively.":[175]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-17T00:00:00"}
