{"id":"https://openalex.org/W3000889789","doi":"https://doi.org/10.32657/10356/136763","title":"Understanding and improving interactive systems design with human-in-the-loop machine learning","display_name":"Understanding and improving interactive systems design with human-in-the-loop machine learning","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3000889789","doi":"https://doi.org/10.32657/10356/136763","mag":"3000889789"},"language":"en","primary_location":{"id":"doi:10.32657/10356/136763","is_oa":true,"landing_page_url":"https://doi.org/10.32657/10356/136763","pdf_url":"https://dr.ntu.edu.sg/bitstream/10356/136763/2/Final_thesis_Zhang_Yaqian.pdf","source":null,"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Nanyang Technological University","raw_type":"dissertation"},"type":"dissertation","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dr.ntu.edu.sg/bitstream/10356/136763/2/Final_thesis_Zhang_Yaqian.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100761536","display_name":"Yaqian Zhang","orcid":"https://orcid.org/0000-0003-0267-0879"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhang, Yaqian","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5100761536"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9898999929428101,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9898999929428101,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.9821000099182129,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9785000085830688,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8151552081108093},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6285539269447327},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.625440776348114},{"id":"https://openalex.org/keywords/human-in-the-loop","display_name":"Human-in-the-loop","score":0.62152498960495},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.6089990139007568},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5985831022262573},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5471280813217163},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.4718496799468994},{"id":"https://openalex.org/keywords/loop","display_name":"Loop (graph theory)","score":0.47051018476486206},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.38871434330940247}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8151552081108093},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6285539269447327},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.625440776348114},{"id":"https://openalex.org/C2780626000","wikidata":"https://www.wikidata.org/wiki/Q5936775","display_name":"Human-in-the-loop","level":2,"score":0.62152498960495},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.6089990139007568},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5985831022262573},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5471280813217163},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.4718496799468994},{"id":"https://openalex.org/C184670325","wikidata":"https://www.wikidata.org/wiki/Q512604","display_name":"Loop (graph theory)","level":2,"score":0.47051018476486206},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.38871434330940247},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.32657/10356/136763","is_oa":true,"landing_page_url":"https://doi.org/10.32657/10356/136763","pdf_url":"https://dr.ntu.edu.sg/bitstream/10356/136763/2/Final_thesis_Zhang_Yaqian.pdf","source":null,"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Nanyang Technological University","raw_type":"dissertation"},{"id":"pmh:oai:dr.ntu.edu.sg:10356/136763","is_oa":true,"landing_page_url":"https://hdl.handle.net/10356/136763","pdf_url":null,"source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Thesis-Doctor of Philosophy"}],"best_oa_location":{"id":"doi:10.32657/10356/136763","is_oa":true,"landing_page_url":"https://doi.org/10.32657/10356/136763","pdf_url":"https://dr.ntu.edu.sg/bitstream/10356/136763/2/Final_thesis_Zhang_Yaqian.pdf","source":null,"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Nanyang Technological University","raw_type":"dissertation"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3000889789.pdf","grobid_xml":"https://content.openalex.org/works/W3000889789.grobid-xml"},"referenced_works_count":137,"referenced_works":["https://openalex.org/W27261483","https://openalex.org/W41757025","https://openalex.org/W83447802","https://openalex.org/W101836494","https://openalex.org/W131488235","https://openalex.org/W618991135","https://openalex.org/W1191599655","https://openalex.org/W1427025258","https://openalex.org/W1498180239","https://openalex.org/W1499869008","https://openalex.org/W1510073064","https://openalex.org/W1515851193","https://openalex.org/W1523767002","https://openalex.org/W1530276735","https://openalex.org/W1703398075","https://openalex.org/W1746901417","https://openalex.org/W1747565446","https://openalex.org/W1754268392","https://openalex.org/W1771410628","https://openalex.org/W1975152892","https://openalex.org/W1977591411","https://openalex.org/W1983069677","https://openalex.org/W1986021671","https://openalex.org/W1996329987","https://openalex.org/W2001619934","https://openalex.org/W2013142139","https://openalex.org/W2014032207","https://openalex.org/W2017088752","https://openalex.org/W2017107247","https://openalex.org/W2018789853","https://openalex.org/W2028692765","https://openalex.org/W2032843080","https://openalex.org/W2032998783","https://openalex.org/W2040658551","https://openalex.org/W2043977898","https://openalex.org/W2046518304","https://openalex.org/W2048365415","https://openalex.org/W2053075547","https://openalex.org/W2053718475","https://openalex.org/W2055734602","https://openalex.org/W2065808876","https://openalex.org/W2070855716","https://openalex.org/W2071949631","https://openalex.org/W2077414173","https://openalex.org/W2079476777","https://openalex.org/W2090658088","https://openalex.org/W2092736096","https://openalex.org/W2095668460","https://openalex.org/W2098515641","https://openalex.org/W2100855956","https://openalex.org/W2101561060","https://openalex.org/W2103459159","https://openalex.org/W2103993786","https://openalex.org/W2108630796","https://openalex.org/W2108738385","https://openalex.org/W2110119381","https://openalex.org/W2110687866","https://openalex.org/W2115403524","https://openalex.org/W2116736830","https://openalex.org/W2119717200","https://openalex.org/W2126046748","https://openalex.org/W2127218421","https://openalex.org/W2128804044","https://openalex.org/W2129991388","https://openalex.org/W2133808442","https://openalex.org/W2137345341","https://openalex.org/W2139233234","https://openalex.org/W2145339207","https://openalex.org/W2147768505","https://openalex.org/W2151784643","https://openalex.org/W2152414052","https://openalex.org/W2152871594","https://openalex.org/W2153111836","https://openalex.org/W2153874175","https://openalex.org/W2154447040","https://openalex.org/W2155027007","https://openalex.org/W2158782408","https://openalex.org/W2160527423","https://openalex.org/W2162506329","https://openalex.org/W2163033248","https://openalex.org/W2163605009","https://openalex.org/W2164571637","https://openalex.org/W2165150801","https://openalex.org/W2165835468","https://openalex.org/W2165960883","https://openalex.org/W2170567160","https://openalex.org/W2201581102","https://openalex.org/W2260756217","https://openalex.org/W2278288686","https://openalex.org/W2280163991","https://openalex.org/W2300445845","https://openalex.org/W2323085590","https://openalex.org/W2337351188","https://openalex.org/W2395927087","https://openalex.org/W2398193891","https://openalex.org/W2401887447","https://openalex.org/W2411687077","https://openalex.org/W2413509892","https://openalex.org/W2520350376","https://openalex.org/W2543669033","https://openalex.org/W2556669480","https://openalex.org/W2577350134","https://openalex.org/W2577451910","https://openalex.org/W2579135379","https://openalex.org/W2593031413","https://openalex.org/W2612958079","https://openalex.org/W2615533740","https://openalex.org/W2739702254","https://openalex.org/W2747188572","https://openalex.org/W2766447205","https://openalex.org/W2786303200","https://openalex.org/W2786887383","https://openalex.org/W2793471804","https://openalex.org/W2904617079","https://openalex.org/W2950492145","https://openalex.org/W2951799221","https://openalex.org/W2964003344","https://openalex.org/W2964043796","https://openalex.org/W2964319760","https://openalex.org/W2964337555","https://openalex.org/W3105728206","https://openalex.org/W3112073073","https://openalex.org/W3120740533","https://openalex.org/W3125846736","https://openalex.org/W4210267601","https://openalex.org/W4234236334","https://openalex.org/W4238392649","https://openalex.org/W4240039288","https://openalex.org/W4242401062","https://openalex.org/W4245652239","https://openalex.org/W4247820460","https://openalex.org/W4252105763","https://openalex.org/W4253794406","https://openalex.org/W4256078332","https://openalex.org/W4296586256","https://openalex.org/W4300618951","https://openalex.org/W4302570325"],"related_works":["https://openalex.org/W24774503","https://openalex.org/W4306904969","https://openalex.org/W4288099294","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W2031695474","https://openalex.org/W4367173559","https://openalex.org/W2782058284","https://openalex.org/W3103937890"],"abstract_inverted_index":{"New":[0],"developments":[1],"in":[2,122,148,151],"machine":[3,40],"learning":[4,41,60],"techniques":[5],"have":[6],"created":[7],"opportunities":[8],"for":[9],"the":[10,27,47,53,74,117,123],"Human-Computer":[11],"Interaction":[12],"(HCI)":[13],"community":[14],"to":[15,20,45,67,72,107,115,138,141],"incorporate":[16,97],"more":[17],"intelligent":[18],"means":[19],"improve":[21,46],"and":[22,34,65,132,135,144,150],"enhance":[23,108],"user":[24],"experience":[25],"during":[26],"interaction.":[28],"This":[29],"thesis":[30],"starts":[31],"by":[32,77],"exploring":[33],"identifying":[35],"a":[36,58,86],"suitable":[37,59],"role":[38],"where":[39],"algorithms":[42],"can":[43,96],"play":[44],"design":[48],"of":[49,100,128],"interactive":[50,79],"systems.":[51,80],"Once":[52],"area":[54],"has":[55,62],"been":[56,63],"identified,":[57],"algorithm":[61],"designed":[64],"evaluated":[66],"ensure":[68],"it":[69],"is":[70],"able":[71,140],"address":[73,83],"constraints":[75],"posed":[76],"human-in-the-loop":[78],"tasks.":[81],"To":[82],"these":[84],"constraints,":[85],"novel":[87],"bootstrapped":[88],"policy":[89,105],"gradient":[90,106],"(BPG)":[91],"framework":[92],"was":[93,113,136],"developed,":[94],"which":[95],"prior":[98],"knowledge":[99],"di":[101,118],"culty":[102,119],"ranking":[103],"into":[104],"sample":[109],"e":[110],"ciency.":[111],"BPG":[112],"applied":[114],"solve":[116],"adaptation":[120],"problem":[121],"challenging":[124],"RL":[125],"environment":[126],"comprising":[127],"large":[129],"action":[130],"spaces":[131],"short":[133],"horizon,":[134],"demonstrated":[137],"be":[139],"achieve":[142],"fast":[143],"unbiased":[145],"convergence":[146],"both":[147],"theory":[149],"practice.":[152]},"counts_by_year":[],"updated_date":"2026-03-25T13:04:00.132906","created_date":"2025-10-10T00:00:00"}
