{"id":"https://openalex.org/W2922180654","doi":"https://doi.org/10.23919/apsipa.2018.8659528","title":"Weakly Labeled Learning Using BLSTM-CTC for Sound Event Detection","display_name":"Weakly Labeled Learning Using BLSTM-CTC for Sound Event Detection","publication_year":2018,"publication_date":"2018-11-01","ids":{"openalex":"https://openalex.org/W2922180654","doi":"https://doi.org/10.23919/apsipa.2018.8659528","mag":"2922180654"},"language":"en","primary_location":{"id":"doi:10.23919/apsipa.2018.8659528","is_oa":false,"landing_page_url":"https://doi.org/10.23919/apsipa.2018.8659528","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5066093174","display_name":"Taiki Matsuyoshi","orcid":null},"institutions":[{"id":"https://openalex.org/I146399215","display_name":"University of Tsukuba","ror":"https://ror.org/02956yf07","country_code":"JP","type":"education","lineage":["https://openalex.org/I146399215"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Taiki Matsuyoshi","raw_affiliation_strings":["University of Tsukuba, Japan"],"affiliations":[{"raw_affiliation_string":"University of Tsukuba, Japan","institution_ids":["https://openalex.org/I146399215"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113730169","display_name":"Tatsuya Komatsu","orcid":null},"institutions":[{"id":"https://openalex.org/I118347220","display_name":"NEC (Japan)","ror":"https://ror.org/04jndar25","country_code":"JP","type":"company","lineage":["https://openalex.org/I118347220"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tatsuya Komatsu","raw_affiliation_strings":["NEC Corporation, Japan"],"affiliations":[{"raw_affiliation_string":"NEC Corporation, Japan","institution_ids":["https://openalex.org/I118347220"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041279908","display_name":"Reishi Kondo","orcid":null},"institutions":[{"id":"https://openalex.org/I118347220","display_name":"NEC (Japan)","ror":"https://ror.org/04jndar25","country_code":"JP","type":"company","lineage":["https://openalex.org/I118347220"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Reishi Kondo","raw_affiliation_strings":["NEC Corporation, Japan"],"affiliations":[{"raw_affiliation_string":"NEC Corporation, Japan","institution_ids":["https://openalex.org/I118347220"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073170587","display_name":"Takeshi Yamada","orcid":"https://orcid.org/0000-0002-5744-8469"},"institutions":[{"id":"https://openalex.org/I146399215","display_name":"University of Tsukuba","ror":"https://ror.org/02956yf07","country_code":"JP","type":"education","lineage":["https://openalex.org/I146399215"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Takeshi Yamada","raw_affiliation_strings":["University of Tsukuba, Japan"],"affiliations":[{"raw_affiliation_string":"University of Tsukuba, Japan","institution_ids":["https://openalex.org/I146399215"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5075702573","display_name":"Shoji Makino","orcid":"https://orcid.org/0000-0003-1934-640X"},"institutions":[{"id":"https://openalex.org/I146399215","display_name":"University of Tsukuba","ror":"https://ror.org/02956yf07","country_code":"JP","type":"education","lineage":["https://openalex.org/I146399215"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Shoji Makino","raw_affiliation_strings":["University of Tsukuba, Japan"],"affiliations":[{"raw_affiliation_string":"University of Tsukuba, Japan","institution_ids":["https://openalex.org/I146399215"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5066093174"],"corresponding_institution_ids":["https://openalex.org/I146399215"],"apc_list":null,"apc_paid":null,"fwci":0.4954,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.66425777,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1918","last_page":"1923"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7445740103721619},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.6305934190750122},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.516967236995697},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4890049695968628},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4834826588630676},{"id":"https://openalex.org/keywords/timestamp","display_name":"Timestamp","score":0.47562435269355774},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4642435312271118},{"id":"https://openalex.org/keywords/multi-task-learning","display_name":"Multi-task learning","score":0.43843719363212585},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.37854301929473877},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.0799306333065033}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7445740103721619},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.6305934190750122},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.516967236995697},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4890049695968628},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4834826588630676},{"id":"https://openalex.org/C113954288","wikidata":"https://www.wikidata.org/wiki/Q186885","display_name":"Timestamp","level":2,"score":0.47562435269355774},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4642435312271118},{"id":"https://openalex.org/C28006648","wikidata":"https://www.wikidata.org/wiki/Q6934509","display_name":"Multi-task learning","level":3,"score":0.43843719363212585},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.37854301929473877},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0799306333065033},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.23919/apsipa.2018.8659528","is_oa":false,"landing_page_url":"https://doi.org/10.23919/apsipa.2018.8659528","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W1566256432","https://openalex.org/W1650531274","https://openalex.org/W2064675550","https://openalex.org/W2107878631","https://openalex.org/W2127141656","https://openalex.org/W2331166300","https://openalex.org/W2408239454","https://openalex.org/W2483962956","https://openalex.org/W2678199776","https://openalex.org/W2786317847","https://openalex.org/W6633947590","https://openalex.org/W6702387769"],"related_works":["https://openalex.org/W2060561905","https://openalex.org/W1417711376","https://openalex.org/W1986883493","https://openalex.org/W2469862403","https://openalex.org/W2166378262","https://openalex.org/W4379524643","https://openalex.org/W2035891203","https://openalex.org/W2367807705","https://openalex.org/W2011027677","https://openalex.org/W2951720331"],"abstract_inverted_index":{"In":[0,70],"this":[1],"paper,":[2],"we":[3,74,139],"propose":[4],"a":[5,83,121,141,164,206,227],"method":[6,168],"of":[7,11,27,37,45,65,80,86,94,99,124,135,154,209],"weakly":[8,56,114,125,218],"labeled":[9,57,78,88,115,126,211,219],"learning":[10,28,79,116,180,204,220,224],"bidirectional":[12],"long":[13],"short-term":[14],"memory":[15],"(BLSTM)":[16],"using":[17,42,55,82,120,146,205],"connectionist":[18],"temporal":[19],"classification":[20],"(BLSTM-CTC)":[21],"to":[22,33],"reduce":[23],"the":[24,35,46,62,71,92,95,133,136,147,166,170,178,188,194],"hand-labeling":[25,229],"cost":[26,190],"samples.":[29,212],"BLSTM-CTC":[30,119],"enables":[31],"us":[32],"update":[34],"parameters":[36],"BLSTM":[38,81,225],"by":[39,150,174,191,199],"loss":[40],"calculation":[41,49],"CTC,":[43],"instead":[44],"exact":[47],"error":[48],"that":[50,216],"cannot":[51],"be":[52],"conducted":[53,140],"when":[54],"samples,":[58,89],"which":[59,90],"have":[60,91],"only":[61],"event":[63,103,106,143],"class":[64],"each":[66,100],"individual":[67,101],"sound":[68,102,142],"event.":[69],"proposed":[72,137,167],"method,":[73,138],"first":[75],"conduct":[76,113],"strongly":[77,87,210],"small":[84],"amount":[85,123,208],"timestamps":[93],"beginning":[96],"and":[97,104,152,157],"end":[98],"its":[105],"class,":[107],"as":[108,128],"initial":[109,179],"learning.":[110,130],"We":[111],"then":[112],"based":[117],"on":[118],"large":[122,207],"samples":[127],"additional":[129,203],"To":[131],"evaluate":[132],"performance":[134],"detection":[144],"experiment":[145],"dataset":[148],"provided":[149],"Detection":[151],"Classification":[153],"Acoustic":[155],"Scenes":[156],"Events":[158],"(DCASE)":[159],"2016":[160],"Task":[161],"2.":[162],"As":[163],"result,":[165],"improved":[169],"segment-based":[171],"F1":[172,195],"score":[173,196],"1.9%":[175],"compared":[176],"with":[177,202,226],"mentioned":[181],"above.":[182],"Furthermore,":[183],"it":[184],"succeeded":[185],"in":[186],"reducing":[187],"labeling":[189],"95%,":[192],"although":[193],"was":[197],"degraded":[198],"1.3%,":[200],"comparing":[201],"This":[213],"result":[214],"confirms":[215],"our":[217],"is":[221],"effective":[222],"for":[223],"low":[228],"cost.":[230]},"counts_by_year":[{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
