{"id":"https://openalex.org/W4401906482","doi":"https://doi.org/10.1109/icdl61372.2024.10644266","title":"Learning While Sleeping: Integrating Sleep-Inspired Consolidation with Human Feedback Learning","display_name":"Learning While Sleeping: Integrating Sleep-Inspired Consolidation with Human Feedback Learning","publication_year":2024,"publication_date":"2024-05-20","ids":{"openalex":"https://openalex.org/W4401906482","doi":"https://doi.org/10.1109/icdl61372.2024.10644266"},"language":"en","primary_location":{"id":"doi:10.1109/icdl61372.2024.10644266","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icdl61372.2024.10644266","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Development and Learning (ICDL)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5091625881","display_name":"Imene Tarakli","orcid":"https://orcid.org/0000-0001-8975-0980"},"institutions":[{"id":"https://openalex.org/I71422933","display_name":"Sheffield Hallam University","ror":"https://ror.org/019wt1929","country_code":"GB","type":"education","lineage":["https://openalex.org/I71422933"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Imene Tarakli","raw_affiliation_strings":["Sheffield Hallam University,Sheffield,United Kingdom"],"affiliations":[{"raw_affiliation_string":"Sheffield Hallam University,Sheffield,United Kingdom","institution_ids":["https://openalex.org/I71422933"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073115503","display_name":"Alessandro Di Nuovo","orcid":"https://orcid.org/0000-0003-2677-2650"},"institutions":[{"id":"https://openalex.org/I71422933","display_name":"Sheffield Hallam University","ror":"https://ror.org/019wt1929","country_code":"GB","type":"education","lineage":["https://openalex.org/I71422933"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Alessandro Di Nuovo","raw_affiliation_strings":["Sheffield Hallam University,Sheffield,United Kingdom"],"affiliations":[{"raw_affiliation_string":"Sheffield Hallam University,Sheffield,United Kingdom","institution_ids":["https://openalex.org/I71422933"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5091625881"],"corresponding_institution_ids":["https://openalex.org/I71422933"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.13392596,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"34","issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10985","display_name":"Sleep and Wakefulness Research","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10985","display_name":"Sleep and Wakefulness Research","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/consolidation","display_name":"Consolidation (business)","score":0.6093623042106628},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5990534424781799},{"id":"https://openalex.org/keywords/sleep","display_name":"Sleep (system call)","score":0.5410128831863403},{"id":"https://openalex.org/keywords/memory-consolidation","display_name":"Memory consolidation","score":0.5172534584999084},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.38454893231391907},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.357634574174881},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.2965591549873352},{"id":"https://openalex.org/keywords/neuroscience","display_name":"Neuroscience","score":0.25830113887786865},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.07982507348060608}],"concepts":[{"id":"https://openalex.org/C2776014549","wikidata":"https://www.wikidata.org/wiki/Q3050847","display_name":"Consolidation (business)","level":2,"score":0.6093623042106628},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5990534424781799},{"id":"https://openalex.org/C2775841894","wikidata":"https://www.wikidata.org/wiki/Q4683692","display_name":"Sleep (system call)","level":2,"score":0.5410128831863403},{"id":"https://openalex.org/C48455012","wikidata":"https://www.wikidata.org/wiki/Q2892593","display_name":"Memory consolidation","level":3,"score":0.5172534584999084},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38454893231391907},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.357634574174881},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.2965591549873352},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.25830113887786865},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.07982507348060608},{"id":"https://openalex.org/C2781161787","wikidata":"https://www.wikidata.org/wiki/Q48360","display_name":"Hippocampus","level":2,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C121955636","wikidata":"https://www.wikidata.org/wiki/Q4116214","display_name":"Accounting","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/icdl61372.2024.10644266","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icdl61372.2024.10644266","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Development and Learning (ICDL)","raw_type":"proceedings-article"},{"id":"pmh:oai:shura.shu.ac.uk:33782","is_oa":false,"landing_page_url":"http://orcid.org/0000-0003-2677-2650>","pdf_url":null,"source":{"id":"https://openalex.org/S4306401600","display_name":"SHURA (Sheffield Hallam University Research Archive) (Sheffield Hallam University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I71422933","host_organization_name":"Sheffield Hallam University","host_organization_lineage":["https://openalex.org/I71422933"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"PeerReviewed"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W1453801241","https://openalex.org/W2060392742","https://openalex.org/W2086162146","https://openalex.org/W2121110499","https://openalex.org/W2145339207","https://openalex.org/W2149927646","https://openalex.org/W2156869222","https://openalex.org/W2550702553","https://openalex.org/W2597613574","https://openalex.org/W2916746008","https://openalex.org/W2963489214","https://openalex.org/W3002947507","https://openalex.org/W3213657171","https://openalex.org/W3213774989","https://openalex.org/W4214717370","https://openalex.org/W4283394711","https://openalex.org/W4285079896","https://openalex.org/W4287273849","https://openalex.org/W4288593469","https://openalex.org/W4362638468","https://openalex.org/W4389157295","https://openalex.org/W6732417791","https://openalex.org/W6747473740","https://openalex.org/W6758427599","https://openalex.org/W6791623595","https://openalex.org/W6797805595","https://openalex.org/W6803914020","https://openalex.org/W6858354804"],"related_works":["https://openalex.org/W2167194856","https://openalex.org/W2086243992","https://openalex.org/W1999611011","https://openalex.org/W2885453218","https://openalex.org/W4389734400","https://openalex.org/W4205580732","https://openalex.org/W2047240100","https://openalex.org/W2042354688","https://openalex.org/W2104761387","https://openalex.org/W3121414111"],"abstract_inverted_index":{"Sleep":[0],"plays":[1],"a":[2,42,49,78],"vital":[3],"role":[4],"in":[5,109,122],"developmental":[6],"learning.":[7,124],"It":[8],"allows":[9],"the":[10,19,23,35,59,69,90,94,101,110,113,117],"brain":[11],"to":[12,68,106,119],"consolidate":[13],"daily":[14],"learning":[15,60,67],"experiences":[16],"by":[17,61],"replaying":[18],"memories":[20],"accumulated":[21],"throughout":[22],"day.":[24],"In":[25],"this":[26],"work,":[27],"we":[28],"take":[29],"inspiration":[30],"from":[31,53],"sleep":[32],"and":[33,112],"propose":[34],"Inverse":[36],"Forward":[37],"Offline":[38],"Reinforcement":[39],"Model":[40],"(INFORM),":[41],"novel":[43],"scalable":[44],"framework":[45],"that":[46,75,81,87,100],"first":[47],"learns":[48,83],"set":[50],"of":[51,93],"behaviours":[52],"human":[54],"evaluative":[55],"feedback,":[56],"then":[57],"consolidates":[58],"applying":[62],"an":[63,84],"offline":[64],"inverse":[65],"reinforcement":[66],"memorised":[70],"trajectories.":[71],"Experimental":[72],"results":[73],"demonstrate":[74],"INFORM":[76],"is":[77],"feedback-efficient":[79],"method":[80],"effectively":[82],"optimal":[85],"policy":[86],"aligns":[88],"with":[89],"intended":[91],"behaviour":[92],"human.":[95],"A":[96],"comparative":[97],"analysis":[98],"shows":[99],"learnt":[102],"policies":[103],"are":[104],"robust":[105],"dynamic":[107],"changes":[108],"environment":[111],"recovered":[114],"rewards":[115],"allow":[116],"robot":[118],"be":[120],"autonomous":[121],"its":[123],"Project":[125],"website:":[126],"https://sites.google.com/view/inform-framework":[127]},"counts_by_year":[],"updated_date":"2025-12-26T23:08:49.675405","created_date":"2025-10-10T00:00:00"}
