{"id":"https://openalex.org/W2022398498","doi":"https://doi.org/10.1109/slt.2014.7078593","title":"Temporal supervised learning for inferring a dialog policy from example conversations","display_name":"Temporal supervised learning for inferring a dialog policy from example conversations","publication_year":2014,"publication_date":"2014-12-01","ids":{"openalex":"https://openalex.org/W2022398498","doi":"https://doi.org/10.1109/slt.2014.7078593","mag":"2022398498"},"language":"en","primary_location":{"id":"doi:10.1109/slt.2014.7078593","is_oa":false,"landing_page_url":"https://doi.org/10.1109/slt.2014.7078593","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE Spoken Language Technology Workshop (SLT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100711454","display_name":"Lihong Li","orcid":"https://orcid.org/0000-0002-5440-8242"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Lihong Li","raw_affiliation_strings":["Minicrosoft Research, Redmond, WA, USA","[Microsoft Research,Redmond,WA,USA]"],"affiliations":[{"raw_affiliation_string":"Minicrosoft Research, Redmond, WA, USA","institution_ids":[]},{"raw_affiliation_string":"[Microsoft Research,Redmond,WA,USA]","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100775952","display_name":"He He","orcid":"https://orcid.org/0000-0002-9118-2449"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"He He","raw_affiliation_strings":["University of Maryland, College Park, MD, USA","University of Maryland \u2014 College Park, USA,"],"affiliations":[{"raw_affiliation_string":"University of Maryland, College Park, MD, USA","institution_ids":["https://openalex.org/I66946132"]},{"raw_affiliation_string":"University of Maryland \u2014 College Park, USA,","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103246485","display_name":"J. D. Williams","orcid":"https://orcid.org/0000-0003-2460-9673"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jason D. Williams","raw_affiliation_strings":["Minicrosoft Research, Redmond, WA, USA","[Microsoft Research,Redmond,WA,USA]"],"affiliations":[{"raw_affiliation_string":"Minicrosoft Research, Redmond, WA, USA","institution_ids":[]},{"raw_affiliation_string":"[Microsoft Research,Redmond,WA,USA]","institution_ids":["https://openalex.org/I1290206253"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100711454"],"corresponding_institution_ids":["https://openalex.org/I1290206253"],"apc_list":null,"apc_paid":null,"fwci":2.96,"has_fulltext":false,"cited_by_count":18,"citation_normalized_percentile":{"value":0.92073297,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"312","last_page":"317"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10456","display_name":"Multi-Agent Systems and Negotiation","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dialog-box","display_name":"Dialog box","score":0.913170337677002},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8404190540313721},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7492047548294067},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6999722719192505},{"id":"https://openalex.org/keywords/supervised-learning","display_name":"Supervised learning","score":0.5505849123001099},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5105913281440735},{"id":"https://openalex.org/keywords/conversation","display_name":"Conversation","score":0.5070676803588867},{"id":"https://openalex.org/keywords/dialog-system","display_name":"Dialog system","score":0.5005178451538086},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4539473056793213},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.36207157373428345},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.08485344052314758},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.07444176077842712}],"concepts":[{"id":"https://openalex.org/C173853756","wikidata":"https://www.wikidata.org/wiki/Q86915","display_name":"Dialog box","level":2,"score":0.913170337677002},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8404190540313721},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7492047548294067},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6999722719192505},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.5505849123001099},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5105913281440735},{"id":"https://openalex.org/C2777200299","wikidata":"https://www.wikidata.org/wiki/Q52943","display_name":"Conversation","level":2,"score":0.5070676803588867},{"id":"https://openalex.org/C190954187","wikidata":"https://www.wikidata.org/wiki/Q5270587","display_name":"Dialog system","level":3,"score":0.5005178451538086},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4539473056793213},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.36207157373428345},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.08485344052314758},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.07444176077842712},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/slt.2014.7078593","is_oa":false,"landing_page_url":"https://doi.org/10.1109/slt.2014.7078593","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 IEEE Spoken Language Technology Workshop (SLT)","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.699.6417","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.699.6417","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.research.rutgers.edu/%7Elihong/pub/Li14Temporal.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.702.9669","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.702.9669","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.umiacs.umd.edu/%7Ehhe/paper-slt.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.46000000834465027,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W120790241","https://openalex.org/W192920577","https://openalex.org/W1520048352","https://openalex.org/W1931877416","https://openalex.org/W1979299372","https://openalex.org/W1986014385","https://openalex.org/W1999874108","https://openalex.org/W2021151961","https://openalex.org/W2054795804","https://openalex.org/W2080045301","https://openalex.org/W2098774185","https://openalex.org/W2104544334","https://openalex.org/W2111550420","https://openalex.org/W2119567691","https://openalex.org/W2120346334","https://openalex.org/W2121863487","https://openalex.org/W2141559645","https://openalex.org/W2158349948","https://openalex.org/W2334782222","https://openalex.org/W2468040214","https://openalex.org/W2586680856","https://openalex.org/W2962957031","https://openalex.org/W4214717370","https://openalex.org/W4285719527","https://openalex.org/W6604922617","https://openalex.org/W6607789263","https://openalex.org/W6640174482","https://openalex.org/W6664273919","https://openalex.org/W6670543721","https://openalex.org/W6674884181","https://openalex.org/W6677737365","https://openalex.org/W6720222513"],"related_works":["https://openalex.org/W48079147","https://openalex.org/W2394821827","https://openalex.org/W326836678","https://openalex.org/W2500779211","https://openalex.org/W1963944933","https://openalex.org/W2563921006","https://openalex.org/W1600043506","https://openalex.org/W2174703168","https://openalex.org/W2111550420","https://openalex.org/W3133893348"],"abstract_inverted_index":{"This":[0],"paper":[1],"tackles":[2],"the":[3,25,28,46,50,143,149,154,157,164],"problem":[4,61],"of":[5,27,49,86,113,135,156],"learning":[6,66,71,179],"a":[7,39,73,83,90,94,117,160,172,182],"dialog":[8,37,54,91,145,161,173],"policy":[9],"from":[10,16,104,127],"example":[11,105,128],"dialogs":[12,106],"-":[13,52],"for":[14],"example,":[15],"Wizard-of-Oz":[17],"style":[18],"dialogs,":[19,129],"where":[20],"an":[21],"expert":[22],"(person)":[23],"plays":[24],"role":[26],"system.":[29],"Learning":[30,123],"in":[31,42,163,167],"this":[32,60],"setting":[33],"is":[34,38,140],"challenging":[35],"because":[36],"temporal":[40,177],"process":[41],"which":[43,124],"actions":[44],"affect":[45],"future":[47],"course":[48],"conversation":[51],"i.e.,":[53],"requires":[55,79],"planning.":[56,114,136],"Past":[57],"work":[58],"solved":[59],"with":[62,176],"either":[63],"conventional":[64,186],"supervised":[65,98,178,187],"or":[67,93],"reinforcement":[68],"learning.":[69,188],"Reinforcement":[70],"provides":[72],"principled":[74],"approach":[75],"to":[76,141,147],"planning,":[77],"but":[78,107],"more":[80],"resources":[81],"than":[82],"fixed":[84],"corpus":[85],"examples,":[87],"such":[88],"as":[89],"simulator":[92],"reward":[95],"function.":[96],"Conventional":[97],"learning,":[99],"by":[100],"contrast,":[101],"operates":[102],"directly":[103,126],"does":[108],"not":[109],"take":[110],"proper":[111,133],"account":[112,134],"We":[115],"introduce":[116],"new":[118],"algorithm":[119],"called":[120],"Temporal":[121],"Supervised":[122],"learns":[125],"while":[130],"also":[131],"taking":[132],"The":[137],"key":[138],"idea":[139],"choose":[142],"next":[144],"action":[146],"maximize":[148],"expected":[150],"discounted":[151],"accuracy":[152],"until":[153],"end":[155],"dialog.":[158],"On":[159],"testbed":[162],"calendar":[165],"domain,":[166],"simulation,":[168],"we":[169],"show":[170],"that":[171],"manager":[174],"trained":[175,184],"substantially":[180],"outperforms":[181],"baseline":[183],"using":[185]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":3}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
