{"id":"https://openalex.org/W4415288097","doi":"https://doi.org/10.48550/arxiv.2503.15918","title":"Denoising-based Contractive Imitation Learning","display_name":"Denoising-based Contractive Imitation Learning","publication_year":2025,"publication_date":"2025-03-20","ids":{"openalex":"https://openalex.org/W4415288097","doi":"https://doi.org/10.48550/arxiv.2503.15918"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2503.15918","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2503.15918","pdf_url":"https://arxiv.org/pdf/2503.15918","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2503.15918","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Shen, Macheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Macheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041244560","display_name":"Jishen Peng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Peng, Jishen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5109725008","display_name":"Zefang Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Zefang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9204999804496765,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9204999804496765,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9132999777793884,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5266000032424927},{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.522599995136261},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.48570001125335693},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.4440999925136566},{"id":"https://openalex.org/keywords/covariate","display_name":"Covariate","score":0.3978999853134155},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.3718999922275543},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.34130001068115234}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6414999961853027},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6216999888420105},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.54339998960495},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5266000032424927},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.522599995136261},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.48570001125335693},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4440999925136566},{"id":"https://openalex.org/C119043178","wikidata":"https://www.wikidata.org/wiki/Q320723","display_name":"Covariate","level":2,"score":0.3978999853134155},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.3718999922275543},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.34130001068115234},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.30410000681877136},{"id":"https://openalex.org/C194232998","wikidata":"https://www.wikidata.org/wiki/Q1606712","display_name":"Transition (genetics)","level":3,"score":0.30160000920295715},{"id":"https://openalex.org/C163415756","wikidata":"https://www.wikidata.org/wiki/Q126473","display_name":"Contraction (grammar)","level":2,"score":0.29789999127388},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.2669999897480011},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.26260000467300415},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.2621999979019165},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.25540000200271606},{"id":"https://openalex.org/C47822265","wikidata":"https://www.wikidata.org/wiki/Q854457","display_name":"Complex system","level":2,"score":0.2515000104904175}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2503.15918","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2503.15918","pdf_url":"https://arxiv.org/pdf/2503.15918","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2503.15918","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2503.15918","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2503.15918","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2503.15918","pdf_url":"https://arxiv.org/pdf/2503.15918","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"A":[0],"fundamental":[1],"challenge":[2],"in":[3,35],"imitation":[4,151,178],"learning":[5,152,179],"is":[6,140],"the":[7,60,64,83,87,109,118,128,132,163],"\\emph{covariate":[8],"shift}":[9],"problem.":[10],"Existing":[11],"methods":[12],"to":[13,23,49,142,162],"mitigate":[14,50],"covariate":[15,51],"shift":[16,52],"often":[17],"require":[18],"additional":[19,156],"expert":[20,157],"interactions,":[21],"access":[22],"environment":[24],"dynamics,":[25],"or":[26,159],"complex":[27,160],"adversarial":[28],"training,":[29],"which":[30],"may":[31],"not":[32],"be":[33,146],"practical":[34],"real-world":[36],"applications.":[37],"In":[38],"this":[39,102],"paper,":[40],"we":[41],"propose":[42],"a":[43,55,75,91,123],"simple":[44],"yet":[45],"effective":[46],"method":[47,139],"(DeCIL)":[48],"by":[53],"incorporating":[54],"denoising":[56,94,106,119],"mechanism":[57],"that":[58,81,100,117,169],"enhances":[59],"contraction":[61,125],"properties":[62],"of":[63,131,176],"state":[65,85,103,133],"transition":[66,134],"mapping.":[67],"Our":[68,138],"approach":[69,171],"involves":[70],"training":[71,164],"two":[72],"neural":[73],"networks:":[74],"dynamics":[76],"model":[77],"(":[78,97],"f":[79],")":[80,99],"predicts":[82],"next":[84],"from":[86],"current":[88],"state,":[89],"and":[90,107,135,144],"joint":[92],"state-action":[93],"policy":[95],"network":[96,120],"d":[98],"refines":[101],"prediction":[104],"via":[105],"outputs":[108],"corresponding":[110],"action.":[111],"We":[112],"provide":[113],"theoretical":[114],"analysis":[115],"showing":[116],"acts":[121],"as":[122],"local":[124],"mapping,":[126],"reducing":[127],"error":[129],"propagation":[130],"improving":[136],"stability.":[137],"straightforward":[141],"implement":[143],"can":[145],"easily":[147],"integrated":[148],"with":[149],"existing":[150],"frameworks":[153],"without":[154],"requiring":[155],"data":[158],"modifications":[161],"procedure.":[165],"Empirical":[166],"results":[167],"demonstrate":[168],"our":[170],"effectively":[172],"improves":[173],"success":[174],"rate":[175],"various":[177],"tasks":[180],"under":[181],"noise":[182],"perturbation.":[183]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-17T00:00:00"}
