{"id":"https://openalex.org/W2965396565","doi":"https://doi.org/10.3390/make1030051","title":"Deep Learning Based Object Recognition Using Physically-Realistic Synthetic Depth Scenes","display_name":"Deep Learning Based Object Recognition Using Physically-Realistic Synthetic Depth Scenes","publication_year":2019,"publication_date":"2019-08-06","ids":{"openalex":"https://openalex.org/W2965396565","doi":"https://doi.org/10.3390/make1030051","mag":"2965396565"},"language":"en","primary_location":{"id":"doi:10.3390/make1030051","is_oa":true,"landing_page_url":"https://doi.org/10.3390/make1030051","pdf_url":"https://www.mdpi.com/2504-4990/1/3/51/pdf?version=1565094551","source":{"id":"https://openalex.org/S4210213891","display_name":"Machine Learning and Knowledge Extraction","issn_l":"2504-4990","issn":["2504-4990"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning and Knowledge Extraction","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2504-4990/1/3/51/pdf?version=1565094551","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5082502206","display_name":"Daulet Baimukashev","orcid":"https://orcid.org/0000-0002-1432-8205"},"institutions":[{"id":"https://openalex.org/I60559429","display_name":"Nazarbayev University","ror":"https://ror.org/052bx8q98","country_code":"KZ","type":"education","lineage":["https://openalex.org/I60559429"]}],"countries":["KZ"],"is_corresponding":false,"raw_author_name":"Daulet Baimukashev","raw_affiliation_strings":["Department of Robotics, Nazarbayev University, 53 Kabanbay batyr Ave., Astana Z05H0P9, Kazakhstan"],"raw_orcid":"https://orcid.org/0000-0002-1432-8205","affiliations":[{"raw_affiliation_string":"Department of Robotics, Nazarbayev University, 53 Kabanbay batyr Ave., Astana Z05H0P9, Kazakhstan","institution_ids":["https://openalex.org/I60559429"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022738654","display_name":"Alikhan Zhilisbayev","orcid":null},"institutions":[{"id":"https://openalex.org/I60559429","display_name":"Nazarbayev University","ror":"https://ror.org/052bx8q98","country_code":"KZ","type":"education","lineage":["https://openalex.org/I60559429"]}],"countries":["KZ"],"is_corresponding":false,"raw_author_name":"Alikhan Zhilisbayev","raw_affiliation_strings":["Department of Robotics, Nazarbayev University, 53 Kabanbay batyr Ave., Astana Z05H0P9, Kazakhstan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Robotics, Nazarbayev University, 53 Kabanbay batyr Ave., Astana Z05H0P9, Kazakhstan","institution_ids":["https://openalex.org/I60559429"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024720741","display_name":"Askat Kuzdeuov","orcid":"https://orcid.org/0000-0001-6169-8252"},"institutions":[{"id":"https://openalex.org/I60559429","display_name":"Nazarbayev University","ror":"https://ror.org/052bx8q98","country_code":"KZ","type":"education","lineage":["https://openalex.org/I60559429"]}],"countries":["KZ"],"is_corresponding":false,"raw_author_name":"Askat Kuzdeuov","raw_affiliation_strings":["Department of Robotics, Nazarbayev University, 53 Kabanbay batyr Ave., Astana Z05H0P9, Kazakhstan"],"raw_orcid":"https://orcid.org/0000-0001-6169-8252","affiliations":[{"raw_affiliation_string":"Department of Robotics, Nazarbayev University, 53 Kabanbay batyr Ave., Astana Z05H0P9, Kazakhstan","institution_ids":["https://openalex.org/I60559429"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031356551","display_name":"Artemiy Oleinikov","orcid":"https://orcid.org/0000-0003-3064-6104"},"institutions":[{"id":"https://openalex.org/I60559429","display_name":"Nazarbayev University","ror":"https://ror.org/052bx8q98","country_code":"KZ","type":"education","lineage":["https://openalex.org/I60559429"]}],"countries":["KZ"],"is_corresponding":false,"raw_author_name":"Artemiy Oleinikov","raw_affiliation_strings":["Department of Robotics, Nazarbayev University, 53 Kabanbay batyr Ave., Astana Z05H0P9, Kazakhstan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Robotics, Nazarbayev University, 53 Kabanbay batyr Ave., Astana Z05H0P9, Kazakhstan","institution_ids":["https://openalex.org/I60559429"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076908321","display_name":"Denis Fadeyev","orcid":null},"institutions":[{"id":"https://openalex.org/I60559429","display_name":"Nazarbayev University","ror":"https://ror.org/052bx8q98","country_code":"KZ","type":"education","lineage":["https://openalex.org/I60559429"]}],"countries":["KZ"],"is_corresponding":false,"raw_author_name":"Denis Fadeyev","raw_affiliation_strings":["Department of Robotics, Nazarbayev University, 53 Kabanbay batyr Ave., Astana Z05H0P9, Kazakhstan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Robotics, Nazarbayev University, 53 Kabanbay batyr Ave., Astana Z05H0P9, Kazakhstan","institution_ids":["https://openalex.org/I60559429"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091740767","display_name":"Zhanat Makhataeva","orcid":"https://orcid.org/0000-0001-9366-7047"},"institutions":[{"id":"https://openalex.org/I60559429","display_name":"Nazarbayev University","ror":"https://ror.org/052bx8q98","country_code":"KZ","type":"education","lineage":["https://openalex.org/I60559429"]}],"countries":["KZ"],"is_corresponding":false,"raw_author_name":"Zhanat Makhataeva","raw_affiliation_strings":["Department of Robotics, Nazarbayev University, 53 Kabanbay batyr Ave., Astana Z05H0P9, Kazakhstan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Robotics, Nazarbayev University, 53 Kabanbay batyr Ave., Astana Z05H0P9, Kazakhstan","institution_ids":["https://openalex.org/I60559429"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044782949","display_name":"H\u00fcseyin Atakan Varol","orcid":"https://orcid.org/0000-0002-4042-425X"},"institutions":[{"id":"https://openalex.org/I60559429","display_name":"Nazarbayev University","ror":"https://ror.org/052bx8q98","country_code":"KZ","type":"education","lineage":["https://openalex.org/I60559429"]}],"countries":["KZ"],"is_corresponding":true,"raw_author_name":"Huseyin Atakan Varol","raw_affiliation_strings":["Department of Robotics, Nazarbayev University, 53 Kabanbay batyr Ave., Astana Z05H0P9, Kazakhstan"],"raw_orcid":"https://orcid.org/0000-0002-4042-425X","affiliations":[{"raw_affiliation_string":"Department of Robotics, Nazarbayev University, 53 Kabanbay batyr Ave., Astana Z05H0P9, Kazakhstan","institution_ids":["https://openalex.org/I60559429"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5044782949"],"corresponding_institution_ids":["https://openalex.org/I60559429"],"apc_list":{"value":1400,"currency":"CHF","value_usd":1515},"apc_paid":{"value":1400,"currency":"CHF","value_usd":1515},"fwci":0.5106,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.69315531,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"1","issue":"3","first_page":"883","last_page":"903"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.8960455656051636},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7642294764518738},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.7314887046813965},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6614305377006531},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6205306649208069},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5783844590187073},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.560337245464325},{"id":"https://openalex.org/keywords/grasp","display_name":"GRASP","score":0.5189220905303955},{"id":"https://openalex.org/keywords/cognitive-neuroscience-of-visual-object-recognition","display_name":"Cognitive neuroscience of visual object recognition","score":0.4940200448036194},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4682140350341797},{"id":"https://openalex.org/keywords/synthetic-data","display_name":"Synthetic data","score":0.4540163278579712},{"id":"https://openalex.org/keywords/orientation","display_name":"Orientation (vector space)","score":0.4196779131889343},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4164389967918396},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.07503503561019897}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.8960455656051636},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7642294764518738},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.7314887046813965},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6614305377006531},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6205306649208069},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5783844590187073},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.560337245464325},{"id":"https://openalex.org/C171268870","wikidata":"https://www.wikidata.org/wiki/Q1486676","display_name":"GRASP","level":2,"score":0.5189220905303955},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.4940200448036194},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4682140350341797},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.4540163278579712},{"id":"https://openalex.org/C16345878","wikidata":"https://www.wikidata.org/wiki/Q107472979","display_name":"Orientation (vector space)","level":2,"score":0.4196779131889343},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4164389967918396},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07503503561019897},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3390/make1030051","is_oa":true,"landing_page_url":"https://doi.org/10.3390/make1030051","pdf_url":"https://www.mdpi.com/2504-4990/1/3/51/pdf?version=1565094551","source":{"id":"https://openalex.org/S4210213891","display_name":"Machine Learning and Knowledge Extraction","issn_l":"2504-4990","issn":["2504-4990"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning and Knowledge Extraction","raw_type":"journal-article"},{"id":"pmh:oai:mdpi.com:/2504-4990/1/3/51/","is_oa":true,"landing_page_url":"http://dx.doi.org/10.3390/make1030051","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Machine Learning and Knowledge Extraction","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.3390/make1030051","is_oa":true,"landing_page_url":"https://doi.org/10.3390/make1030051","pdf_url":"https://www.mdpi.com/2504-4990/1/3/51/pdf?version=1565094551","source":{"id":"https://openalex.org/S4210213891","display_name":"Machine Learning and Knowledge Extraction","issn_l":"2504-4990","issn":["2504-4990"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning and Knowledge Extraction","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/8","score":0.7200000286102295,"display_name":"Decent work and economic growth"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2965396565.pdf","grobid_xml":"https://content.openalex.org/works/W2965396565.grobid-xml"},"referenced_works_count":59,"referenced_works":["https://openalex.org/W156975732","https://openalex.org/W639708223","https://openalex.org/W1731081199","https://openalex.org/W1949568868","https://openalex.org/W1972292376","https://openalex.org/W1984475609","https://openalex.org/W1985231173","https://openalex.org/W1987648924","https://openalex.org/W2031489346","https://openalex.org/W2049116836","https://openalex.org/W2060613652","https://openalex.org/W2087477843","https://openalex.org/W2095639956","https://openalex.org/W2097117768","https://openalex.org/W2099160252","https://openalex.org/W2099940712","https://openalex.org/W2102605133","https://openalex.org/W2109992539","https://openalex.org/W2127725869","https://openalex.org/W2128359381","https://openalex.org/W2131953535","https://openalex.org/W2133803071","https://openalex.org/W2147629985","https://openalex.org/W2156222070","https://openalex.org/W2160890830","https://openalex.org/W2163605009","https://openalex.org/W2167340365","https://openalex.org/W2172156083","https://openalex.org/W2193145675","https://openalex.org/W2194775991","https://openalex.org/W2343052201","https://openalex.org/W2529170537","https://openalex.org/W2529729570","https://openalex.org/W2557728737","https://openalex.org/W2563100679","https://openalex.org/W2591690290","https://openalex.org/W2593957897","https://openalex.org/W2604662268","https://openalex.org/W2618530766","https://openalex.org/W2650354119","https://openalex.org/W2770201929","https://openalex.org/W2780351918","https://openalex.org/W2798936443","https://openalex.org/W2805661097","https://openalex.org/W2919115771","https://openalex.org/W2952213706","https://openalex.org/W2952302849","https://openalex.org/W2953240077","https://openalex.org/W2962759496","https://openalex.org/W2962837662","https://openalex.org/W2963037989","https://openalex.org/W2963231598","https://openalex.org/W2963271314","https://openalex.org/W2963956866","https://openalex.org/W2964271185","https://openalex.org/W2964350391","https://openalex.org/W3101196391","https://openalex.org/W3106250896","https://openalex.org/W6637618735"],"related_works":["https://openalex.org/W2163296013","https://openalex.org/W165915117","https://openalex.org/W2326995835","https://openalex.org/W2743859443","https://openalex.org/W2059402478","https://openalex.org/W2123347777","https://openalex.org/W4387804363","https://openalex.org/W2477150073","https://openalex.org/W2969228573","https://openalex.org/W4387272257"],"abstract_inverted_index":{"Recognizing":[0],"objects":[1,26,117,135],"and":[2,23,79,94,131,161,188,225,254,263],"estimating":[3],"their":[4],"poses":[5],"have":[6],"a":[7,34,52,68,97,103,111,121,154,167,237],"wide":[8],"range":[9],"of":[10,25,40,71,74,96,115,156,173],"application":[11],"in":[12,27,33,64,120,236],"robotics.":[13],"For":[14],"instance,":[15],"to":[16,45,50,211,249],"grasp":[17],"objects,":[18],"robots":[19],"need":[20],"the":[21,92,184,191,196,205,232,247,252,259],"position":[22],"orientation":[24],"3D.":[28],"The":[29,213],"task":[30],"becomes":[31],"challenging":[32],"cluttered":[35,65,238],"environment":[36],"with":[37,136,200],"different":[38],"types":[39],"objects.":[41],"A":[42],"popular":[43],"approach":[44],"tackle":[46],"this":[47,87],"problem":[48],"is":[49],"utilize":[51],"deep":[53,60,98,197,243],"neural":[54],"network":[55],"for":[56,83,151,208,228,258],"object":[57,62,99,177,214,229,244],"recognition.":[58],"However,":[59],"learning-based":[61],"detection":[63,181,215,245],"environments":[66],"requires":[67,77],"substantial":[69],"amount":[70],"data.":[72],"Collection":[73],"these":[75],"data":[76,235,261],"time":[78,253],"extensive":[80,260],"human":[81,255],"labor":[82],"manual":[84],"labeling.":[85,264],"In":[86],"study,":[88],"our":[89],"objective":[90],"was":[91,149,164],"development":[93],"validation":[95],"recognition":[100,206,230],"framework":[101,216],"using":[102,153],"synthetic":[104,158,192,202],"depth":[105,112,159,169,186,193,223,234,241],"image":[106,113,170],"dataset.":[107],"We":[108],"synthetically":[109,221],"generated":[110,222],"dataset":[114,155,171],"22":[116],"randomly":[118],"placed":[119],"0.5":[122,125],"m":[123,126,129],"\u00d7":[124,127],"0.1":[128],"box,":[130],"automatically":[132],"labeled":[133],"all":[134],"an":[137],"occlusion":[138],"rate":[139],"below":[140],"70%.":[141],"Faster":[142],"Region":[143],"Convolutional":[144],"Neural":[145],"Network":[146],"(R-CNN)":[147],"architecture":[148],"adopted":[150],"training":[152],"800,000":[157],"images,":[160],"its":[162],"performance":[163],"tested":[165],"on":[166,183,190,220,231],"real-world":[168],"consisting":[172],"2000":[174],"samples.":[175],"Deep":[176],"recognizer":[178],"has":[179,246],"40.96%":[180],"accuracy":[182,207],"real":[185,209,233],"images":[187,203,210],"93.5%":[189],"images.":[194],"Training":[195],"learning":[198],"model":[199],"noise-added":[201],"improves":[204],"46.3%.":[212],"can":[217],"be":[218],"trained":[219],"data,":[224],"then":[226],"employed":[227],"environment.":[239],"Synthetic":[240],"data-based":[242],"potential":[248],"substantially":[250],"decrease":[251],"effort":[256],"required":[257],"collection":[262]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
