{"id":"https://openalex.org/W4312521235","doi":"https://doi.org/10.1109/iros47612.2022.9981907","title":"Self-supervised Wide Baseline Visual Servoing via 3D Equivariance","display_name":"Self-supervised Wide Baseline Visual Servoing via 3D Equivariance","publication_year":2022,"publication_date":"2022-10-23","ids":{"openalex":"https://openalex.org/W4312521235","doi":"https://doi.org/10.1109/iros47612.2022.9981907"},"language":"en","primary_location":{"id":"doi:10.1109/iros47612.2022.9981907","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros47612.2022.9981907","pdf_url":null,"source":{"id":"https://openalex.org/S4363607704","display_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000951599","display_name":"Jinwook Huh","orcid":"https://orcid.org/0000-0002-1550-6632"},"institutions":[{"id":"https://openalex.org/I4210101778","display_name":"Samsung (United States)","ror":"https://ror.org/01bfbvm65","country_code":"US","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210101778"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Jinwook Huh","raw_affiliation_strings":["Samsung AI Center NY,New York,NY,10014"],"affiliations":[{"raw_affiliation_string":"Samsung AI Center NY,New York,NY,10014","institution_ids":["https://openalex.org/I4210101778"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110745295","display_name":"Jungseok Hong","orcid":null},"institutions":[{"id":"https://openalex.org/I4210101778","display_name":"Samsung (United States)","ror":"https://ror.org/01bfbvm65","country_code":"US","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210101778"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jungseok Hong","raw_affiliation_strings":["Samsung AI Center NY,New York,NY,10014"],"affiliations":[{"raw_affiliation_string":"Samsung AI Center NY,New York,NY,10014","institution_ids":["https://openalex.org/I4210101778"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041458715","display_name":"Suveer Garg","orcid":"https://orcid.org/0000-0001-5752-8760"},"institutions":[{"id":"https://openalex.org/I4210101778","display_name":"Samsung (United States)","ror":"https://ror.org/01bfbvm65","country_code":"US","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210101778"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Suveer Garg","raw_affiliation_strings":["Samsung AI Center NY,New York,NY,10014"],"affiliations":[{"raw_affiliation_string":"Samsung AI Center NY,New York,NY,10014","institution_ids":["https://openalex.org/I4210101778"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101538702","display_name":"Hyun Soo Park","orcid":"https://orcid.org/0000-0001-6613-0738"},"institutions":[{"id":"https://openalex.org/I4210101778","display_name":"Samsung (United States)","ror":"https://ror.org/01bfbvm65","country_code":"US","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210101778"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hyun Soo Park","raw_affiliation_strings":["Samsung AI Center NY,New York,NY,10014"],"affiliations":[{"raw_affiliation_string":"Samsung AI Center NY,New York,NY,10014","institution_ids":["https://openalex.org/I4210101778"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033839227","display_name":"Volkan Isler","orcid":"https://orcid.org/0000-0002-0868-5441"},"institutions":[{"id":"https://openalex.org/I4210101778","display_name":"Samsung (United States)","ror":"https://ror.org/01bfbvm65","country_code":"US","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210101778"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Volkan Isler","raw_affiliation_strings":["Samsung AI Center NY,New York,NY,10014"],"affiliations":[{"raw_affiliation_string":"Samsung AI Center NY,New York,NY,10014","institution_ids":["https://openalex.org/I4210101778"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5000951599"],"corresponding_institution_ids":["https://openalex.org/I4210101778"],"apc_list":null,"apc_paid":null,"fwci":0.1199,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.43968345,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"2227","last_page":"2233"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10638","display_name":"Optical measurement and interference techniques","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/visual-servoing","display_name":"Visual servoing","score":0.9386734366416931},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.7234474420547485},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.716474175453186},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.626904308795929},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5396655797958374},{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.5165656805038452},{"id":"https://openalex.org/keywords/transformation","display_name":"Transformation (genetics)","score":0.5164408683776855},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.48477238416671753},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4452567398548126},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.2745479345321655}],"concepts":[{"id":"https://openalex.org/C10912380","wikidata":"https://www.wikidata.org/wiki/Q527952","display_name":"Visual servoing","level":3,"score":0.9386734366416931},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7234474420547485},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.716474175453186},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.626904308795929},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5396655797958374},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.5165656805038452},{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.5164408683776855},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.48477238416671753},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4452567398548126},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2745479345321655},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iros47612.2022.9981907","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros47612.2022.9981907","pdf_url":null,"source":{"id":"https://openalex.org/S4363607704","display_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W1526868886","https://openalex.org/W1607376109","https://openalex.org/W1612997784","https://openalex.org/W2082991751","https://openalex.org/W2129000642","https://openalex.org/W2151103935","https://openalex.org/W2167501464","https://openalex.org/W2194775991","https://openalex.org/W2198618282","https://openalex.org/W2200124539","https://openalex.org/W2522940611","https://openalex.org/W2535547924","https://openalex.org/W2592936284","https://openalex.org/W2605048551","https://openalex.org/W2620115845","https://openalex.org/W2795645133","https://openalex.org/W2910687636","https://openalex.org/W2922243907","https://openalex.org/W2940957385","https://openalex.org/W2962783853","https://openalex.org/W2963150697","https://openalex.org/W2963188159","https://openalex.org/W2996058491","https://openalex.org/W3003339604","https://openalex.org/W3045988483","https://openalex.org/W3049043369","https://openalex.org/W3092152581","https://openalex.org/W3102327032","https://openalex.org/W3133026276","https://openalex.org/W3147149346","https://openalex.org/W4207020220","https://openalex.org/W4289489637","https://openalex.org/W4301151840","https://openalex.org/W6629652696","https://openalex.org/W6736178813","https://openalex.org/W6738940082","https://openalex.org/W6754677871","https://openalex.org/W6772286975"],"related_works":["https://openalex.org/W2126852585","https://openalex.org/W2367086100","https://openalex.org/W2352270872","https://openalex.org/W1520171478","https://openalex.org/W2386520554","https://openalex.org/W4317830657","https://openalex.org/W2127866683","https://openalex.org/W3024380338","https://openalex.org/W2065095941","https://openalex.org/W2637148753"],"abstract_inverted_index":{"One":[0],"of":[1,76,82,112],"the":[2,11,25,77,80,118,123,136,156,159,168,171,189],"challenging":[3],"input":[4],"settings":[5,21],"for":[6,47,178],"visual":[7,44,92,180,197],"servoing":[8,45,198],"is":[9,103,120,131,184],"when":[10],"initial":[12],"and":[13,35,174,222],"goal":[14],"camera":[15,64],"views":[16],"are":[17,22],"far":[18],"apart.":[19],"Such":[20],"difficult":[23],"because":[24],"wide":[26,48],"baseline":[27,49],"can":[28,144,162],"cause":[29,36],"drastic":[30],"changes":[31],"in":[32,79,105,133,170],"object":[33,70,78,201],"appearance":[34],"occlusions.":[37],"This":[38],"paper":[39],"presents":[40],"a":[41,90,96,106,110,127,140,196],"novel":[42],"self-supervised":[43],"method":[46,183],"images":[50],"which":[51],"does":[52],"not":[53],"require":[54,71],"3D":[55,72,83,100,113,153,211],"ground":[56,73],"truth":[57,74],"supervision.":[58,154,212],"Existing":[59],"approaches":[60,208],"that":[61,117,143,209],"regress":[62],"absolute":[63],"pose":[65],"with":[66,135,204,228],"respect":[67,205],"to":[68,122,206],"an":[69],"data":[75],"forms":[81],"bounding":[84],"boxes":[85],"or":[86,200],"meshes.":[87],"We":[88,138],"learn":[89],"coherent":[91],"representation":[93,102],"by":[94,166],"leveraging":[95],"geometric":[97,149],"property":[98],"called":[99],"equivariance\u2014the":[101],"transformed":[104],"predictable":[107],"way":[108],"as":[109,176],"function":[111],"transformation.":[114],"To":[115],"ensure":[116],"feature-space":[119],"faithful":[121],"underlying":[124],"geodesic":[125,128],"space,":[126],"preserving":[129],"constraint":[130],"applied":[132],"conjunction":[134],"equivariance.":[137],"design":[139],"Siamese":[141],"network":[142],"effectively":[145],"enforce":[146],"these":[147],"two":[148],"properties":[150],"without":[151],"requiring":[152],"With":[155],"learned":[157,172],"model,":[158],"relative":[160],"transformation":[161],"be":[163],"inferred":[164],"simply":[165],"following":[167],"gradient":[169],"space":[173],"used":[175],"feedback":[177],"closed-loop":[179],"servoing.":[181],"Our":[182],"evaluated":[185],"on":[186,195],"objects":[187],"from":[188],"YCB":[190],"dataset,":[191],"showing":[192],"meaningful":[193],"outperformance":[194],"task,":[199],"alignment":[202],"task":[203],"state-of-the-art":[207],"use":[210],"Ours":[213],"yields":[214],"more":[215,223],"than":[216,224],"35%":[217],"average":[218],"distance":[219],"error":[220,230],"reduction":[221],"90%":[225],"success":[226],"rate":[227],"3cm":[229],"tolerance.":[231]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-01-13T01:12:25.745995","created_date":"2025-10-10T00:00:00"}
