{"id":"https://openalex.org/W4416749012","doi":"https://doi.org/10.1109/iros60139.2025.11247097","title":"RoboEngine: Plug-and-Play Robot Data Augmentation with Semantic Robot Segmentation and Background Generation","display_name":"RoboEngine: Plug-and-Play Robot Data Augmentation with Semantic Robot Segmentation and Background Generation","publication_year":2025,"publication_date":"2025-10-19","ids":{"openalex":"https://openalex.org/W4416749012","doi":"https://doi.org/10.1109/iros60139.2025.11247097"},"language":null,"primary_location":{"id":"doi:10.1109/iros60139.2025.11247097","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros60139.2025.11247097","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023581735","display_name":"Chengbo Yuan","orcid":"https://orcid.org/0000-0002-9004-0908"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chengbo Yuan","raw_affiliation_strings":["Tsinghua University,Institute for Interdisciplinary Information Sciences"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Institute for Interdisciplinary Information Sciences","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114207298","display_name":"Suraj Joshi","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Suraj Joshi","raw_affiliation_strings":["Tsinghua University,Department of Computer Science and Technology"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Department of Computer Science and Technology","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040608113","display_name":"Shaoting Zhu","orcid":"https://orcid.org/0009-0000-9294-6212"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shaoting Zhu","raw_affiliation_strings":["Tsinghua University,Institute for Interdisciplinary Information Sciences"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Institute for Interdisciplinary Information Sciences","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100341893","display_name":"Hang Su","orcid":"https://orcid.org/0000-0003-3365-4361"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hang Su","raw_affiliation_strings":["Tsinghua University,Department of Computer Science and Technology"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Department of Computer Science and Technology","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100418980","display_name":"Hang Zhao","orcid":"https://orcid.org/0000-0002-0482-1573"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hang Zhao","raw_affiliation_strings":["Tsinghua University,Institute for Interdisciplinary Information Sciences"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Institute for Interdisciplinary Information Sciences","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5074250521","display_name":"Yang Gao","orcid":"https://orcid.org/0000-0002-2488-1813"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Gao","raw_affiliation_strings":["Tsinghua University,Institute for Interdisciplinary Information Sciences"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Institute for Interdisciplinary Information Sciences","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5023581735"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.44830727,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"7622","last_page":"7629"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.4465999901294708,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.4465999901294708,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.13930000364780426,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.07180000096559525,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.746999979019165},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.659600019454956},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5787000060081482},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.3718999922275543},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.32820001244544983},{"id":"https://openalex.org/keywords/robot-control","display_name":"Robot control","score":0.30820000171661377},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.30660000443458557},{"id":"https://openalex.org/keywords/visual-servoing","display_name":"Visual servoing","score":0.3009999990463257}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7840999960899353},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.746999979019165},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7390999794006348},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6949999928474426},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.659600019454956},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5787000060081482},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.3718999922275543},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.32820001244544983},{"id":"https://openalex.org/C65401140","wikidata":"https://www.wikidata.org/wiki/Q7353385","display_name":"Robot control","level":4,"score":0.30820000171661377},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.30660000443458557},{"id":"https://openalex.org/C10912380","wikidata":"https://www.wikidata.org/wiki/Q527952","display_name":"Visual servoing","level":3,"score":0.3009999990463257},{"id":"https://openalex.org/C168402607","wikidata":"https://www.wikidata.org/wiki/Q2072119","display_name":"Personal robot","level":5,"score":0.28540000319480896},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.28439998626708984},{"id":"https://openalex.org/C2983761899","wikidata":"https://www.wikidata.org/wiki/Q604674","display_name":"Robot vision","level":4,"score":0.27649998664855957},{"id":"https://openalex.org/C5339829","wikidata":"https://www.wikidata.org/wiki/Q1425977","display_name":"Machine vision","level":2,"score":0.27230000495910645},{"id":"https://openalex.org/C162947575","wikidata":"https://www.wikidata.org/wiki/Q2005645","display_name":"Social robot","level":5,"score":0.2653000056743622},{"id":"https://openalex.org/C74222875","wikidata":"https://www.wikidata.org/wiki/Q16000312","display_name":"Robot kinematics","level":4,"score":0.26269999146461487},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.260699987411499},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.2596000134944916},{"id":"https://openalex.org/C25694479","wikidata":"https://www.wikidata.org/wiki/Q7446278","display_name":"Segmentation-based object categorization","level":5,"score":0.25589999556541443},{"id":"https://openalex.org/C192299074","wikidata":"https://www.wikidata.org/wiki/Q2160034","display_name":"Robot calibration","level":5,"score":0.25}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iros60139.2025.11247097","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros60139.2025.11247097","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322392","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W2043547879","https://openalex.org/W2108598243","https://openalex.org/W2443711627","https://openalex.org/W2962766617","https://openalex.org/W2963195169","https://openalex.org/W4312420092","https://openalex.org/W4385430538","https://openalex.org/W4401417065","https://openalex.org/W4402354045","https://openalex.org/W4402354047","https://openalex.org/W4402704543","https://openalex.org/W4402727532","https://openalex.org/W4402754134","https://openalex.org/W4402774769","https://openalex.org/W4402916184","https://openalex.org/W4403337227","https://openalex.org/W4403982072","https://openalex.org/W4405785353","https://openalex.org/W4413155399"],"related_works":[],"abstract_inverted_index":{"Visual":[0],"augmentation":[1,49],"has":[2],"become":[3],"a":[4,66,76,82,89,126,130],"crucial":[5],"technique":[6],"for":[7,30],"enhancing":[8],"the":[9,28,43,52,97,101,108,138,146],"visual":[10,46],"robustness":[11],"of":[12,69,100],"imitation":[13],"learning.":[14],"However,":[15],"existing":[16],"methods":[17],"are":[18,148],"often":[19],"limited":[20],"by":[21],"prerequisites":[22],"such":[23],"as":[24],"camera":[25],"calibration":[26],"or":[27],"need":[29],"controlled":[31],"environments":[32],"(e.g.,":[33],"green":[34],"screen":[35],"setups).":[36],"In":[37],"this":[38],"work,":[39],"we":[40,74,106],"introduce":[41],"RoboEngine,":[42,105],"first":[44,53],"plug-and-play":[45],"robot":[47,62,78,85,112],"data":[48],"toolkit.":[50,103],"For":[51],"time,":[54],"users":[55],"can":[56],"effortlessly":[57],"generate":[58],"physics-":[59],"and":[60,88,145],"task-aware":[61],"scenes":[63],"with":[64],"just":[65],"few":[67],"lines":[68],"code.":[70],"To":[71],"achieve":[72],"this,":[73],"present":[75],"novel":[77],"scene":[79],"segmentation":[80,86],"dataset,":[81],"generalizable":[83],"high-quality":[84],"model,":[87,93],"fine-tuned":[90],"background":[91],"generation":[92],"which":[94],"together":[95],"form":[96],"core":[98],"components":[99],"out-of-the-box":[102],"Using":[104],"demonstrate":[107],"ability":[109],"to":[110,137],"generalize":[111],"manipulation":[113],"tasks":[114],"across":[115],"six":[116],"entirely":[117],"new":[118],"scenes,":[119],"based":[120],"solely":[121],"on":[122],"demonstrations":[123],"collected":[124],"from":[125],"single":[127],"scene,":[128],"achieving":[129],"more":[131],"than":[132],"200%":[133],"performance":[134],"improvement":[135],"compared":[136],"no-augmentation":[139],"baseline.":[140],"All":[141],"datasets,":[142],"model":[143],"weights,":[144],"toolkit":[147],"released":[149],"https://roboengine.github.io/.":[150]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-11-28T00:00:00"}
