{"id":"https://openalex.org/W4317384004","doi":"https://doi.org/10.1109/robio55434.2022.10011669","title":"Learning of 6D Object Poses with Multi-task Point-wise Regression Deep Networks","display_name":"Learning of 6D Object Poses with Multi-task Point-wise Regression Deep Networks","publication_year":2022,"publication_date":"2022-12-05","ids":{"openalex":"https://openalex.org/W4317384004","doi":"https://doi.org/10.1109/robio55434.2022.10011669"},"language":"en","primary_location":{"id":"doi:10.1109/robio55434.2022.10011669","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robio55434.2022.10011669","pdf_url":null,"source":{"id":"https://openalex.org/S4363607789","display_name":"2022 IEEE International Conference on Robotics and Biomimetics (ROBIO)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Robotics and Biomimetics (ROBIO)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072526024","display_name":"Kaixin Bai","orcid":"https://orcid.org/0000-0001-8579-0547"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kaixin Bai","raw_affiliation_strings":["Universit&#x00E4;t Hamburg,TAMS (Technical Aspects of Multimodal Systems), Department of Informatics","Agile Robots AG"],"affiliations":[{"raw_affiliation_string":"Universit&#x00E4;t Hamburg,TAMS (Technical Aspects of Multimodal Systems), Department of Informatics","institution_ids":[]},{"raw_affiliation_string":"Agile Robots AG","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100673610","display_name":"Lei Zhang","orcid":"https://orcid.org/0000-0002-7519-2858"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lei Zhang","raw_affiliation_strings":["Universit&#x00E4;t Hamburg,TAMS (Technical Aspects of Multimodal Systems), Department of Informatics","Agile Robots AG"],"affiliations":[{"raw_affiliation_string":"Universit&#x00E4;t Hamburg,TAMS (Technical Aspects of Multimodal Systems), Department of Informatics","institution_ids":[]},{"raw_affiliation_string":"Agile Robots AG","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101705037","display_name":"Zhaopeng Chen","orcid":"https://orcid.org/0000-0003-0375-9146"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhaopeng Chen","raw_affiliation_strings":["Agile Robots AG"],"affiliations":[{"raw_affiliation_string":"Agile Robots AG","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100326970","display_name":"Jianwei Zhang","orcid":"https://orcid.org/0000-0002-7856-5760"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jianwei Zhang","raw_affiliation_strings":["Universit&#x00E4;t Hamburg,TAMS (Technical Aspects of Multimodal Systems), Department of Informatics"],"affiliations":[{"raw_affiliation_string":"Universit&#x00E4;t Hamburg,TAMS (Technical Aspects of Multimodal Systems), Department of Informatics","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5072526024"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.3538,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.53589484,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1603","last_page":"1609"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10868","display_name":"Soft Robotics and Applications","score":0.9922999739646912,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9771000146865845,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.8585890531539917},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7838532328605652},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7299245595932007},{"id":"https://openalex.org/keywords/grasp","display_name":"GRASP","score":0.5863248705863953},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5734752416610718},{"id":"https://openalex.org/keywords/point-cloud","display_name":"Point cloud","score":0.5569121837615967},{"id":"https://openalex.org/keywords/3d-pose-estimation","display_name":"3D pose estimation","score":0.5118407607078552},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5103375315666199},{"id":"https://openalex.org/keywords/rotation","display_name":"Rotation (mathematics)","score":0.4649706184864044},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4418160021305084},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.4408065676689148},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.4290999472141266},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.411301851272583},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3605117201805115},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3036330044269562}],"concepts":[{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.8585890531539917},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7838532328605652},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7299245595932007},{"id":"https://openalex.org/C171268870","wikidata":"https://www.wikidata.org/wiki/Q1486676","display_name":"GRASP","level":2,"score":0.5863248705863953},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5734752416610718},{"id":"https://openalex.org/C131979681","wikidata":"https://www.wikidata.org/wiki/Q1899648","display_name":"Point cloud","level":2,"score":0.5569121837615967},{"id":"https://openalex.org/C36613465","wikidata":"https://www.wikidata.org/wiki/Q4636322","display_name":"3D pose estimation","level":3,"score":0.5118407607078552},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5103375315666199},{"id":"https://openalex.org/C74050887","wikidata":"https://www.wikidata.org/wiki/Q848368","display_name":"Rotation (mathematics)","level":2,"score":0.4649706184864044},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4418160021305084},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4408065676689148},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4290999472141266},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.411301851272583},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3605117201805115},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3036330044269562},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/robio55434.2022.10011669","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robio55434.2022.10011669","pdf_url":null,"source":{"id":"https://openalex.org/S4363607789","display_name":"2022 IEEE International Conference on Robotics and Biomimetics (ROBIO)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Robotics and Biomimetics (ROBIO)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W1505952289","https://openalex.org/W1526868886","https://openalex.org/W2033574012","https://openalex.org/W2085261163","https://openalex.org/W2132476906","https://openalex.org/W2160821342","https://openalex.org/W2170940415","https://openalex.org/W2460657278","https://openalex.org/W2499170543","https://openalex.org/W2600030077","https://openalex.org/W2605547838","https://openalex.org/W2770046775","https://openalex.org/W2776330782","https://openalex.org/W2806669929","https://openalex.org/W2885242432","https://openalex.org/W2908326044","https://openalex.org/W2945136467","https://openalex.org/W2949924544","https://openalex.org/W2953127211","https://openalex.org/W2961889961","https://openalex.org/W2963177347","https://openalex.org/W2963188159","https://openalex.org/W2963678509","https://openalex.org/W2963826402","https://openalex.org/W2964266557","https://openalex.org/W2967068439","https://openalex.org/W2968410673","https://openalex.org/W2986303149","https://openalex.org/W2987039068","https://openalex.org/W3009928773","https://openalex.org/W3085853000","https://openalex.org/W3103830808","https://openalex.org/W4236965008","https://openalex.org/W4289489637","https://openalex.org/W4293374772","https://openalex.org/W6743668622","https://openalex.org/W6754677871","https://openalex.org/W6762006211","https://openalex.org/W6763422710","https://openalex.org/W6766446667","https://openalex.org/W6864332406"],"related_works":["https://openalex.org/W3021551196","https://openalex.org/W4320086129","https://openalex.org/W4253893311","https://openalex.org/W3089306886","https://openalex.org/W2113785214","https://openalex.org/W2798721181","https://openalex.org/W3201205132","https://openalex.org/W4387967917","https://openalex.org/W4312694060","https://openalex.org/W4386075737"],"abstract_inverted_index":{"6D":[0,26,48,60,81,118,123,135,173,177],"pose":[1,27,49,61,82,124,136,178],"estimation":[2,28,50,83,125,137],"of":[3,14],"known":[4],"objects":[5],"has":[6],"received":[7],"much":[8],"attention":[9],"for":[10,47,79],"its":[11],"wide":[12],"range":[13],"applications,":[15],"especially":[16],"in":[17,87,130,138,187],"robotic":[18,53,180],"grasping.":[19],"In":[20],"recent":[21],"deep":[22],"learning":[23],"methods,":[24],"the":[25,58,68,71,80,107,110,139,156,171],"problem":[29],"can":[30],"be":[31],"converted":[32],"into":[33],"a":[34,41,52,63,76,88,98,116,150,166],"translation-and-rotation":[35],"regression":[36,45,112],"problem.":[37],"Here":[38],"we":[39,148],"propose":[40,149],"novel":[42],"multi-task":[43],"point-wise":[44],"network":[46,84,95,108,126],"and":[51,62,73,164,190],"grasping":[54,181,186],"system":[55,153],"equipped":[56],"with":[57,101,142],"object":[59,172,185],"grasp":[64],"detector.":[65],"To":[66,133],"reduce":[67],"gap":[69],"between":[70],"estimated":[72],"real":[74,140,191],"poses,":[75],"synthetic":[77],"dataset":[78],"is":[85,113],"generated":[86],"physical":[89],"engine":[90],"using":[91],"domain":[92],"randomization.":[93],"This":[94],"directly":[96],"uses":[97],"point":[99],"cloud":[100],"an":[102],"XYZRGB":[103],"formatted":[104],"input.":[105],"During":[106],"training,":[109],"rotation":[111,119],"evaluated":[114],"by":[115,145],"continuous":[117],"representation.":[120],"The":[121,175],"proposed":[122,176],"outperforms":[127],"high-performance":[128],"networks":[129],"real-world":[131],"experiments.":[132,193],"evaluate":[134],"world":[141],"uncertainty":[143],"introduced":[144],"sensor":[146,157],"noise,":[147],"multi-camera":[151],"vision":[152],"that":[154],"fuses":[155],"data":[158],"from":[159],"three":[160],"RealSense":[161],"D415":[162],"cameras":[163],"develop":[165],"grasp-detection":[167],"algorithm":[168],"based":[169],"on":[170],"pose.":[174],"estimation-based":[179],"framework":[182],"performs":[183],"precise":[184],"both":[188],"simulated":[189],"robot":[192]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
