{"id":"https://openalex.org/W2542999985","doi":"https://doi.org/10.1109/icsda.2014.7051436","title":"Conversation dialog corpora from television and movie scripts","display_name":"Conversation dialog corpora from television and movie scripts","publication_year":2014,"publication_date":"2014-09-01","ids":{"openalex":"https://openalex.org/W2542999985","doi":"https://doi.org/10.1109/icsda.2014.7051436","mag":"2542999985"},"language":"en","primary_location":{"id":"doi:10.1109/icsda.2014.7051436","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icsda.2014.7051436","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 17th Oriental Chapter of the International Committee for the Co-ordination and Standardization of Speech Databases and Assessment Techniques (COCOSDA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075433335","display_name":"Lasguido Nio","orcid":null},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Lasguido Nio","raw_affiliation_strings":["Graduate School of Information Science, Nara Institute of Science and Technology, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science, Nara Institute of Science and Technology, Japan","institution_ids":["https://openalex.org/I75917431"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040108974","display_name":"Sakriani Sakti","orcid":"https://orcid.org/0000-0001-5509-8963"},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Sakriani Sakti","raw_affiliation_strings":["Graduate School of Information Science, Nara Institute of Science and Technology, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science, Nara Institute of Science and Technology, Japan","institution_ids":["https://openalex.org/I75917431"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000692949","display_name":"Graham Neubig","orcid":null},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Graham Neubig","raw_affiliation_strings":["Graduate School of Information Science, Nara Institute of Science and Technology, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science, Nara Institute of Science and Technology, Japan","institution_ids":["https://openalex.org/I75917431"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078330211","display_name":"Tomoki Toda","orcid":"https://orcid.org/0000-0001-8146-1279"},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tomoki Toda","raw_affiliation_strings":["Graduate School of Information Science, Nara Institute of Science and Technology, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science, Nara Institute of Science and Technology, Japan","institution_ids":["https://openalex.org/I75917431"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5020994673","display_name":"Satoshi Nakamura","orcid":"https://orcid.org/0000-0001-6956-3803"},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Satoshi Nakamura","raw_affiliation_strings":["Graduate School of Information Science, Nara Institute of Science and Technology, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science, Nara Institute of Science and Technology, Japan","institution_ids":["https://openalex.org/I75917431"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5075433335"],"corresponding_institution_ids":["https://openalex.org/I75917431"],"apc_list":null,"apc_paid":null,"fwci":0.818,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.82812425,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"8","issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/conversation","display_name":"Conversation","score":0.9720709323883057},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7699608206748962},{"id":"https://openalex.org/keywords/scripting-language","display_name":"Scripting language","score":0.6285452246665955},{"id":"https://openalex.org/keywords/dialog-box","display_name":"Dialog box","score":0.5545392632484436},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.4562552869319916},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3688585162162781},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.35798126459121704},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.34465041756629944},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.3054201006889343},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.28477391600608826}],"concepts":[{"id":"https://openalex.org/C2777200299","wikidata":"https://www.wikidata.org/wiki/Q52943","display_name":"Conversation","level":2,"score":0.9720709323883057},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7699608206748962},{"id":"https://openalex.org/C61423126","wikidata":"https://www.wikidata.org/wiki/Q187432","display_name":"Scripting language","level":2,"score":0.6285452246665955},{"id":"https://openalex.org/C173853756","wikidata":"https://www.wikidata.org/wiki/Q86915","display_name":"Dialog box","level":2,"score":0.5545392632484436},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.4562552869319916},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3688585162162781},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35798126459121704},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.34465041756629944},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.3054201006889343},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.28477391600608826},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icsda.2014.7051436","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icsda.2014.7051436","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 17th Oriental Chapter of the International Committee for the Co-ordination and Standardization of Speech Databases and Assessment Techniques (COCOSDA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W10957333","https://openalex.org/W147552783","https://openalex.org/W250521078","https://openalex.org/W1536972981","https://openalex.org/W1539562568","https://openalex.org/W1979299372","https://openalex.org/W1985227831","https://openalex.org/W2097828466","https://openalex.org/W2102258316","https://openalex.org/W2119788759","https://openalex.org/W2127693399","https://openalex.org/W2160458012","https://openalex.org/W2161466446","https://openalex.org/W2169498842","https://openalex.org/W2251155198","https://openalex.org/W2484132317","https://openalex.org/W2574874554","https://openalex.org/W4236521339","https://openalex.org/W4254215309","https://openalex.org/W6600426076","https://openalex.org/W6606056973","https://openalex.org/W6609523175","https://openalex.org/W6632482024","https://openalex.org/W6683412400","https://openalex.org/W6691370976","https://openalex.org/W6731835169"],"related_works":["https://openalex.org/W2098987383","https://openalex.org/W2417260800","https://openalex.org/W1596203174","https://openalex.org/W2117933979","https://openalex.org/W2283130723","https://openalex.org/W103938586","https://openalex.org/W2104718772","https://openalex.org/W4233992201","https://openalex.org/W1968552888","https://openalex.org/W2292950558"],"abstract_inverted_index":{"Example-based":[0],"dialogue":[1],"systems":[2],"often":[3],"require":[4],"natural":[5],"conversation":[6,18,62,91,102,108,125,133],"templates":[7],"as":[8],"examples":[9],"for":[10],"response":[11],"generation.":[12],"However,":[13,49],"in":[14],"previous":[15],"work":[16,51],"most":[17],"corpora":[19,126],"have":[20],"been":[21],"created":[22],"by":[23,94,136],"hand":[24],"and":[25,44,54,66,73,79],"do":[26],"not":[27],"well":[28],"portray":[29],"actual":[30],"conversations":[31,70,115],"between":[32],"two":[33,95,119,137],"people.":[34],"One":[35],"way":[36],"to":[37,42,87,113,140],"overcome":[38],"this":[39,50,58],"problem":[40],"is":[41,52,92],"record":[43],"transcribe":[45],"real":[46],"human-to-human":[47],"conversation.":[48],"tedious":[53],"time":[55],"consuming.":[56],"In":[57,85,121],"work,":[59],"we":[60,97],"utilize":[61],"scripts":[63,75],"from":[64,71,76],"television":[65,72],"movies.":[67],"We":[68],"extract":[69],"movie":[74],"the":[77,90,122],"web":[78],"perform":[80],"various":[81],"types":[82],"of":[83,101],"filtering.":[84],"order":[86],"ensure":[88],"that":[89,131],"performed":[93,135],"speakers,":[96],"introduce":[98],"a":[99,104],"unit":[100],"called":[103],"tri-turn":[105],"(a":[106],"trigram":[107],"turn)":[109],"which":[110],"allow":[111],"us":[112],"filter":[114],"with":[116],"more":[117],"than":[118],"speakers.":[120],"end,":[123],"our":[124],"contains":[127],"86,719":[128],"query-response":[129],"pairs":[130],"represent":[132],"turns":[134],"speakers":[138],"talking":[139],"each":[141],"other.":[142]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":3},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
