{"id":"https://openalex.org/W1522966007","doi":"https://doi.org/10.21437/interspeech.2011-565","title":"Unsupervised continuous-valued word features for phrase-break prediction without a part-of-speech tagger","display_name":"Unsupervised continuous-valued word features for phrase-break prediction without a part-of-speech tagger","publication_year":2011,"publication_date":"2011-08-27","ids":{"openalex":"https://openalex.org/W1522966007","doi":"https://doi.org/10.21437/interspeech.2011-565","mag":"1522966007"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2011-565","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2011-565","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2011","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://www.cstr.ed.ac.uk/downloads/publications/2011/watts_yamagishi_king_2011.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110238677","display_name":"Oliver Watts","orcid":null},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Oliver Watts","raw_affiliation_strings":["University of Edinburgh"],"affiliations":[{"raw_affiliation_string":"University of Edinburgh","institution_ids":["https://openalex.org/I98677209"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007639385","display_name":"Junichi Yamagishi","orcid":"https://orcid.org/0000-0003-2752-3955"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Junichi Yamagishi","raw_affiliation_strings":["School of Informatics"],"affiliations":[{"raw_affiliation_string":"School of Informatics","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5062516688","display_name":"Simon King","orcid":"https://orcid.org/0000-0002-2694-2843"},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Simon King","raw_affiliation_strings":["School of Philosophy Psychology and Language Sciences"],"affiliations":[{"raw_affiliation_string":"School of Philosophy Psychology and Language Sciences","institution_ids":["https://openalex.org/I98677209"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5110238677"],"corresponding_institution_ids":["https://openalex.org/I98677209"],"apc_list":null,"apc_paid":null,"fwci":0.8771,"has_fulltext":true,"cited_by_count":19,"citation_normalized_percentile":{"value":0.7877768,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"2157","last_page":"2160"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.796471357345581},{"id":"https://openalex.org/keywords/phrase","display_name":"Phrase","score":0.7885288000106812},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6597781777381897},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.6550740003585815},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.626929759979248},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5757969617843628},{"id":"https://openalex.org/keywords/part-of-speech-tagging","display_name":"Part-of-speech tagging","score":0.5459219813346863},{"id":"https://openalex.org/keywords/part-of-speech","display_name":"Part of speech","score":0.43649983406066895},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.1412486732006073}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.796471357345581},{"id":"https://openalex.org/C2776224158","wikidata":"https://www.wikidata.org/wiki/Q187931","display_name":"Phrase","level":2,"score":0.7885288000106812},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6597781777381897},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.6550740003585815},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.626929759979248},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5757969617843628},{"id":"https://openalex.org/C2780684714","wikidata":"https://www.wikidata.org/wiki/Q1271424","display_name":"Part-of-speech tagging","level":3,"score":0.5459219813346863},{"id":"https://openalex.org/C123406163","wikidata":"https://www.wikidata.org/wiki/Q82042","display_name":"Part of speech","level":2,"score":0.43649983406066895},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.1412486732006073},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.21437/interspeech.2011-565","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2011-565","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2011","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.ed.ac.uk:publications/f857685a-eb9b-41d8-be72-16839817a062","is_oa":true,"landing_page_url":"https://hdl.handle.net/20.500.11820/f857685a-eb9b-41d8-be72-16839817a062","pdf_url":"http://www.cstr.ed.ac.uk/downloads/publications/2011/watts_yamagishi_king_2011.pdf","source":{"id":"https://openalex.org/S4406922455","display_name":"Edinburgh Research Explorer","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":""},{"id":"pmh:oai:pure.ed.ac.uk:openaire/f857685a-eb9b-41d8-be72-16839817a062","is_oa":true,"landing_page_url":"https://www.research.ed.ac.uk/en/publications/f857685a-eb9b-41d8-be72-16839817a062","pdf_url":null,"source":{"id":"https://openalex.org/S4406922455","display_name":"Edinburgh Research Explorer","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Watts, O, Yamagishi, J & King, S 2011, Unsupervised continuous-valued word features for phrase-break prediction without a part-of-speech tagger. in P Cosi, R De Mori, G Di Fabbrizio & R Pieraccini (eds), Proceedings of the 12th Annual Conference of the International Speech Communication Association. pp. 2157-2160, Interspeech 2011- 12th annual Conference of the International Speech Communication Association , Florence, Italy, 27/08/11. < http://www.isca-speech.org/archive/interspeech_2011/i11_2157.html >","raw_type":"contributionToPeriodical"}],"best_oa_location":{"id":"pmh:oai:pure.ed.ac.uk:publications/f857685a-eb9b-41d8-be72-16839817a062","is_oa":true,"landing_page_url":"https://hdl.handle.net/20.500.11820/f857685a-eb9b-41d8-be72-16839817a062","pdf_url":"http://www.cstr.ed.ac.uk/downloads/publications/2011/watts_yamagishi_king_2011.pdf","source":{"id":"https://openalex.org/S4406922455","display_name":"Edinburgh Research Explorer","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":""},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W1522966007.pdf","grobid_xml":"https://content.openalex.org/works/W1522966007.grobid-xml"},"referenced_works_count":13,"referenced_works":["https://openalex.org/W5192282","https://openalex.org/W47415966","https://openalex.org/W1504308419","https://openalex.org/W1576363916","https://openalex.org/W1594031697","https://openalex.org/W2025617415","https://openalex.org/W2051123508","https://openalex.org/W2081687495","https://openalex.org/W2083675498","https://openalex.org/W2086372363","https://openalex.org/W2147292124","https://openalex.org/W2170206653","https://openalex.org/W2914746235"],"related_works":["https://openalex.org/W1965453504","https://openalex.org/W2396342956","https://openalex.org/W2486838646","https://openalex.org/W2949108231","https://openalex.org/W2626026432","https://openalex.org/W2251183413","https://openalex.org/W2950520410","https://openalex.org/W2046224275","https://openalex.org/W2080020663","https://openalex.org/W2006539681"],"abstract_inverted_index":{"Part":[0],"of":[1,24,31,40,58,80,88,120],"speech":[2,19],"(POS)":[3],"tags":[4,68],"are":[5,52,99],"foremost":[6],"among":[7],"the":[8,29,36,56,59,78,85,114,121,124],"features":[9,82,98,122],"conventionally":[10],"used":[11],"to":[12,18],"predict":[13],"intonational":[14],"phrase-breaks":[15],"for":[16,35,93],"text":[17,65,108],"(TTS)":[20],"conversion.":[21],"The":[22],"construction":[23],"such":[25,48,97],"systems":[26],"therefore":[27,76],"presupposes":[28],"availability":[30],"a":[32,41,129,138,142],"POS":[33,67,94,144],"tagger":[34],"relevant":[37],"language,":[38],"or":[39],"corpus":[42],"manually":[43,63],"tagged":[44],"with":[45,66],"POS.":[46],"However,":[47],"tools":[49],"and":[50,62,72,137],"resources":[51],"not":[53],"available":[54],"in":[55,101,126],"majority":[57],"world\u2019s":[60],"languages,":[61],"labelling":[64],"is":[69],"an":[70,102,106],"expensive":[71],"time-consuming":[73],"process.":[74],"We":[75,110],"propose":[77],"use":[79,119],"continuous-valued":[81],"that":[83],"summarise":[84],"distributional":[86],"characteristics":[87],"word":[89],"types":[90],"as":[91],"surrogates":[92],"features.":[95],"Importantly,":[96],"obtained":[100],"unsupervised":[103],"manner":[104],"from":[105],"untagged":[107],"corpus.":[109],"present":[111],"results":[112],"on":[113],"phrase-break":[115],"prediction":[116],"task,":[117],"where":[118],"closes":[123],"gap":[125],"performance":[127],"between":[128],"baseline":[130],"system":[131,140],"(using":[132],"only":[133],"basic":[134],"punctuation-related":[135],"features)":[136],"topline":[139],"(incorporating":[141],"state-of-the-art":[143],"tagger).":[145]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":3},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":3},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
