{"id":"https://openalex.org/W2067348796","doi":"https://doi.org/10.1145/2168748.2168749","title":"Optimizing the turn-taking behavior of task-oriented spoken dialog systems","display_name":"Optimizing the turn-taking behavior of task-oriented spoken dialog systems","publication_year":2012,"publication_date":"2012-05-01","ids":{"openalex":"https://openalex.org/W2067348796","doi":"https://doi.org/10.1145/2168748.2168749","mag":"2067348796"},"language":"en","primary_location":{"id":"doi:10.1145/2168748.2168749","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2168748.2168749","pdf_url":null,"source":{"id":"https://openalex.org/S200945739","display_name":"ACM Transactions on Speech and Language Processing","issn_l":"1550-4875","issn":["1550-4875","1550-4883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Speech and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5045093641","display_name":"Antoine Raux","orcid":null},"institutions":[{"id":"https://openalex.org/I4210145184","display_name":"Honda (United States)","ror":"https://ror.org/04vdmc602","country_code":"US","type":"company","lineage":["https://openalex.org/I1283473643","https://openalex.org/I4210145184"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Antoine Raux","raw_affiliation_strings":["Honda Research Institute USA, Mountain View, CA","[Honda Research Institute USA, Mountain View, CA]"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Honda Research Institute USA, Mountain View, CA","institution_ids":["https://openalex.org/I4210145184"]},{"raw_affiliation_string":"[Honda Research Institute USA, Mountain View, CA]","institution_ids":["https://openalex.org/I4210145184"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077285164","display_name":"Maxine Esk\u00e9nazi","orcid":null},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Maxine Eskenazi","raw_affiliation_strings":["Carnegie Mellon University, Pittsburgh, PA","Carnegie-Mellon University, Pittsburgh, PA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, Pittsburgh, PA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie-Mellon University, Pittsburgh, PA","institution_ids":["https://openalex.org/I74973139"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":7.5188,"has_fulltext":false,"cited_by_count":45,"citation_normalized_percentile":{"value":0.97110814,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"9","issue":"1","first_page":"1","last_page":"23"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10709","display_name":"Social Robot Interaction and HRI","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10456","display_name":"Multi-Agent Systems and Negotiation","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8551430702209473},{"id":"https://openalex.org/keywords/dialog-box","display_name":"Dialog box","score":0.8442097902297974},{"id":"https://openalex.org/keywords/turn-taking","display_name":"Turn-taking","score":0.8157482147216797},{"id":"https://openalex.org/keywords/conversation","display_name":"Conversation","score":0.7093129754066467},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6778299808502197},{"id":"https://openalex.org/keywords/dialog-system","display_name":"Dialog system","score":0.607246994972229},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5687620043754578},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5335044860839844},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.4539908170700073},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.4532807469367981},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.41746559739112854},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.39380818605422974},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.11861509084701538}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8551430702209473},{"id":"https://openalex.org/C173853756","wikidata":"https://www.wikidata.org/wiki/Q86915","display_name":"Dialog box","level":2,"score":0.8442097902297974},{"id":"https://openalex.org/C2776352735","wikidata":"https://www.wikidata.org/wiki/Q2313343","display_name":"Turn-taking","level":3,"score":0.8157482147216797},{"id":"https://openalex.org/C2777200299","wikidata":"https://www.wikidata.org/wiki/Q52943","display_name":"Conversation","level":2,"score":0.7093129754066467},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6778299808502197},{"id":"https://openalex.org/C190954187","wikidata":"https://www.wikidata.org/wiki/Q5270587","display_name":"Dialog system","level":3,"score":0.607246994972229},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5687620043754578},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5335044860839844},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.4539908170700073},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4532807469367981},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.41746559739112854},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.39380818605422974},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.11861509084701538},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2168748.2168749","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2168748.2168749","pdf_url":null,"source":{"id":"https://openalex.org/S200945739","display_name":"ACM Transactions on Speech and Language Processing","issn_l":"1550-4875","issn":["1550-4875","1550-4883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Speech and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8399999737739563,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G5810314126","display_name":null,"funder_award_id":"208835","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":55,"referenced_works":["https://openalex.org/W26306128","https://openalex.org/W50922381","https://openalex.org/W80222165","https://openalex.org/W116569011","https://openalex.org/W126426901","https://openalex.org/W167770377","https://openalex.org/W178169250","https://openalex.org/W178897730","https://openalex.org/W258661234","https://openalex.org/W792814583","https://openalex.org/W1496781369","https://openalex.org/W1502481855","https://openalex.org/W1508665521","https://openalex.org/W1516479813","https://openalex.org/W1518023928","https://openalex.org/W1518727680","https://openalex.org/W1523412775","https://openalex.org/W1549285799","https://openalex.org/W1566669007","https://openalex.org/W1582147469","https://openalex.org/W1583748115","https://openalex.org/W1593557297","https://openalex.org/W1845380253","https://openalex.org/W1903951673","https://openalex.org/W1934807246","https://openalex.org/W1964725106","https://openalex.org/W1977647663","https://openalex.org/W1986532700","https://openalex.org/W1991123335","https://openalex.org/W1998677696","https://openalex.org/W2007889078","https://openalex.org/W2008741806","https://openalex.org/W2067097374","https://openalex.org/W2093973850","https://openalex.org/W2100844198","https://openalex.org/W2108958052","https://openalex.org/W2109730238","https://openalex.org/W2116906536","https://openalex.org/W2122493499","https://openalex.org/W2127838323","https://openalex.org/W2129090275","https://openalex.org/W2134401851","https://openalex.org/W2138742901","https://openalex.org/W2143427281","https://openalex.org/W2149934480","https://openalex.org/W2153190547","https://openalex.org/W2156597615","https://openalex.org/W2156885227","https://openalex.org/W2161345458","https://openalex.org/W2235920218","https://openalex.org/W2237495196","https://openalex.org/W2325274768","https://openalex.org/W2915722758","https://openalex.org/W3143835353","https://openalex.org/W4248634141"],"related_works":["https://openalex.org/W2500779211","https://openalex.org/W48079147","https://openalex.org/W326836678","https://openalex.org/W1963944933","https://openalex.org/W2563921006","https://openalex.org/W1600043506","https://openalex.org/W2111550420","https://openalex.org/W2549666521","https://openalex.org/W2735573723","https://openalex.org/W3133893348"],"abstract_inverted_index":{"Even":[0],"as":[1,73,139,141],"progress":[2],"in":[3,41],"speech":[4],"technologies":[5],"and":[6,8,30,38,57,78,94],"task":[7],"dialog":[9,18,108],"modeling":[10],"has":[11],"allowed":[12],"the":[13,20,80,104,124,128,131],"development":[14],"of":[15,24,36,50,107,130],"advanced":[16],"spoken":[17],"systems,":[19],"low-level":[21],"interaction":[22],"behavior":[23,106],"those":[25],"systems":[26],"often":[27],"remains":[28],"rigid":[29],"inefficient.":[31],"Based":[32],"on":[33,112],"an":[34],"analysis":[35],"human-human":[37],"human-computer":[39],"turn-taking":[40,72,105],"naturally":[42],"occurring":[43],"task-oriented":[44],"dialogs,":[45],"we":[46],"define":[47],"a":[48,85,95,116,135],"set":[49],"features":[51],"that":[52,59,88,123],"can":[53,61],"be":[54,62],"automatically":[55],"extracted":[56],"show":[58],"they":[60],"used":[63],"to":[64,102,134],"inform":[65],"efficient":[66],"end-of-turn":[67],"detection.":[68],"We":[69],"then":[70],"frame":[71],"decision":[74],"making":[75],"under":[76],"uncertainty":[77],"describe":[79],"Finite-State":[81],"Turn-Taking":[82],"Machine":[83],"(FSTTM),":[84],"decision-theoretic":[86],"model":[87],"combines":[89],"data-driven":[90,143],"machine":[91],"learning":[92],"methods":[93],"cost":[96],"structure":[97],"derived":[98],"from":[99],"Conversation":[100],"Analysis":[101],"control":[103],"systems.":[109],"Evaluation":[110],"results":[111],"CMU":[113],"Let's":[114],"Go,":[115],"publicly":[117],"deployed":[118],"bus":[119],"information":[120],"system,":[121],"confirm":[122],"FSTTM":[125],"significantly":[126],"improves":[127],"responsiveness":[129],"system":[132],"compared":[133],"standard":[136],"threshold-based":[137],"approach,":[138],"well":[140],"previous":[142],"methods.":[144]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":8},{"year":2017,"cited_by_count":5},{"year":2016,"cited_by_count":4},{"year":2015,"cited_by_count":6},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":7},{"year":2012,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
