{"id":"https://openalex.org/W4312107217","doi":"https://doi.org/10.48550/arxiv.2212.10428","title":"HouseCat6D -- A Large-Scale Multi-Modal Category Level 6D Object Perception Dataset with Household Objects in Realistic Scenarios","display_name":"HouseCat6D -- A Large-Scale Multi-Modal Category Level 6D Object Perception Dataset with Household Objects in Realistic Scenarios","publication_year":2022,"publication_date":"2022-12-20","ids":{"openalex":"https://openalex.org/W4312107217","doi":"https://doi.org/10.48550/arxiv.2212.10428"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2212.10428","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2212.10428","pdf_url":"https://arxiv.org/pdf/2212.10428","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2212.10428","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030648992","display_name":"Hyunjun Jung","orcid":"https://orcid.org/0000-0002-6717-1395"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Jung, HyunJun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043978423","display_name":"Shun\u2010Cheng Wu","orcid":"https://orcid.org/0000-0003-4219-3413"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhai, Guangyao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058704206","display_name":"Patrick Ruhkamp","orcid":"https://orcid.org/0000-0001-6541-3111"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Shun-Cheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055662103","display_name":"Guangyao Zhai","orcid":"https://orcid.org/0000-0002-1527-5387"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ruhkamp, Patrick","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020640287","display_name":"Hannah Schieber","orcid":"https://orcid.org/0000-0002-5786-3283"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Schieber, Hannah","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070645069","display_name":"Giulia Rizzoli","orcid":"https://orcid.org/0000-0002-1390-8419"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rizzoli, Giulia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100714810","display_name":"Pengyuan Wang","orcid":"https://orcid.org/0000-0002-6444-1257"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Pengyuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113164754","display_name":"Hongcheng Zhao","orcid":"https://orcid.org/0009-0005-2944-7011"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Hongcheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014520592","display_name":"Lorenzo Garattoni","orcid":"https://orcid.org/0000-0002-6382-0335"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Garattoni, Lorenzo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045305290","display_name":"Sven Meier","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Meier, Sven","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057621778","display_name":"Daniel Roth","orcid":"https://orcid.org/0000-0001-7742-0925"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Roth, Daniel","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046896448","display_name":"Nassir Navab","orcid":"https://orcid.org/0000-0002-6032-5611"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Navab, Nassir","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5067135033","display_name":"Benjamin Busam","orcid":"https://orcid.org/0000-0002-0620-5774"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Busam, Benjamin","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":13,"corresponding_author_ids":["https://openalex.org/A5030648992"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9919999837875366,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7357872128486633},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6939164996147156},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.6665596961975098},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6611169576644897},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5740365982055664},{"id":"https://openalex.org/keywords/grasp","display_name":"GRASP","score":0.5310205817222595},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.5143686532974243},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.5030283331871033},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.4989356994628906},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.4848400354385376},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.44745439291000366},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.4416847825050354},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.4237891435623169},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.34257176518440247},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.32738518714904785},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.16014748811721802},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.13031944632530212},{"id":"https://openalex.org/keywords/cartography","display_name":"Cartography","score":0.06600609421730042}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7357872128486633},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6939164996147156},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.6665596961975098},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6611169576644897},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5740365982055664},{"id":"https://openalex.org/C171268870","wikidata":"https://www.wikidata.org/wiki/Q1486676","display_name":"GRASP","level":2,"score":0.5310205817222595},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.5143686532974243},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.5030283331871033},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.4989356994628906},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.4848400354385376},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.44745439291000366},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.4416847825050354},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.4237891435623169},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.34257176518440247},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32738518714904785},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.16014748811721802},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.13031944632530212},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.06600609421730042},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2212.10428","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2212.10428","pdf_url":"https://arxiv.org/pdf/2212.10428","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2212.10428","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2212.10428","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2212.10428","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2212.10428","pdf_url":"https://arxiv.org/pdf/2212.10428","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/11","score":0.4000000059604645,"display_name":"Sustainable cities and communities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4312107217.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2163296013","https://openalex.org/W2743859443","https://openalex.org/W2326995835","https://openalex.org/W165915117","https://openalex.org/W2059402478","https://openalex.org/W2123347777","https://openalex.org/W4387804363","https://openalex.org/W2477150073","https://openalex.org/W3021551196","https://openalex.org/W627697492"],"abstract_inverted_index":{"Estimating":[0],"6D":[1,47,112],"object":[2],"poses":[3],"is":[4,18],"a":[5,44,106],"major":[6],"challenge":[7],"in":[8,33],"3D":[9],"computer":[10],"vision.":[11],"Building":[12],"on":[13],"successful":[14],"instance-level":[15],"approaches,":[16],"research":[17],"shifting":[19],"towards":[20],"category-level":[21,28,46,124],"pose":[22,37,48,78,125],"estimation":[23,126],"for":[24,122],"practical":[25],"applications.":[26],"Current":[27],"datasets,":[29],"however,":[30],"fall":[31],"short":[32],"annotation":[34],"quality":[35],"and":[36,57,74,102,109],"variety.":[38],"Addressing":[39],"this,":[40],"we":[41,118],"introduce":[42],"HouseCat6D,":[43],"new":[45],"dataset.":[49],"It":[50],"features":[51],"1)":[52],"multi-modality":[53],"with":[54,80,99],"Polarimetric":[55],"RGB":[56],"Depth":[58],"(RGBD+P),":[59],"2)":[60],"encompasses":[61],"194":[62],"diverse":[63],"objects":[64],"across":[65],"10":[66],"household":[67],"categories,":[68],"including":[69],"two":[70],"photometrically":[71],"challenging":[72],"ones,":[73],"3)":[75],"provides":[76],"high-quality":[77],"annotations":[79],"an":[81],"error":[82],"range":[83],"of":[84],"only":[85],"1.35":[86],"mm":[87],"to":[88],"1.74":[89],"mm.":[90],"The":[91],"dataset":[92],"also":[93],"includes":[94],"4)":[95],"41":[96],"large-scale":[97],"scenes":[98],"comprehensive":[100],"viewpoint":[101],"occlusion":[103],"coverage,":[104],"5)":[105],"checkerboard-free":[107],"environment,":[108],"6)":[110],"dense":[111],"parallel-jaw":[113],"robotic":[114],"grasp":[115],"annotations.":[116],"Additionally,":[117],"present":[119],"benchmark":[120],"results":[121],"leading":[123],"networks.":[127]},"counts_by_year":[{"year":2024,"cited_by_count":3}],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2023-01-04T00:00:00"}
