{"id":"https://openalex.org/W3159239022","doi":"https://doi.org/10.23919/dafx51585.2021.9768246","title":"One Billion Audio Sounds from GPU-Enabled Modular Synthesis","display_name":"One Billion Audio Sounds from GPU-Enabled Modular Synthesis","publication_year":2021,"publication_date":"2021-09-08","ids":{"openalex":"https://openalex.org/W3159239022","doi":"https://doi.org/10.23919/dafx51585.2021.9768246","mag":"3159239022"},"language":"en","primary_location":{"id":"doi:10.23919/dafx51585.2021.9768246","is_oa":false,"landing_page_url":"https://doi.org/10.23919/dafx51585.2021.9768246","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 24th International Conference on Digital Audio Effects (DAFx)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072002276","display_name":"Joseph Turian","orcid":null},"institutions":[{"id":"https://openalex.org/I4210123192","display_name":"International Audio Laboratories Erlangen","ror":"https://ror.org/02mkz3e80","country_code":"DE","type":"facility","lineage":["https://openalex.org/I181369854","https://openalex.org/I4210123192","https://openalex.org/I4210124274","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Joseph Turian","raw_affiliation_strings":["Spooky Audio,Berlin,Germany","Spooky Audio, Berlin, Germany"],"affiliations":[{"raw_affiliation_string":"Spooky Audio,Berlin,Germany","institution_ids":["https://openalex.org/I4210123192"]},{"raw_affiliation_string":"Spooky Audio, Berlin, Germany","institution_ids":["https://openalex.org/I4210123192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114117312","display_name":"Jordie Shier","orcid":null},"institutions":[{"id":"https://openalex.org/I212119943","display_name":"University of Victoria","ror":"https://ror.org/04s5mat29","country_code":"CA","type":"education","lineage":["https://openalex.org/I212119943"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Jordie Shier","raw_affiliation_strings":["Computer Science and Music Technology, University of Victoria,Victoria,Canada","Computer Science and Music Technology, University of Victoria, Victoria, Canada"],"affiliations":[{"raw_affiliation_string":"Computer Science and Music Technology, University of Victoria,Victoria,Canada","institution_ids":["https://openalex.org/I212119943"]},{"raw_affiliation_string":"Computer Science and Music Technology, University of Victoria, Victoria, Canada","institution_ids":["https://openalex.org/I212119943"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010445045","display_name":"George Tzanetakis","orcid":"https://orcid.org/0000-0002-6844-7912"},"institutions":[{"id":"https://openalex.org/I212119943","display_name":"University of Victoria","ror":"https://ror.org/04s5mat29","country_code":"CA","type":"education","lineage":["https://openalex.org/I212119943"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"George Tzanetakis","raw_affiliation_strings":["Computer Science and Music Technology, University of Victoria,Victoria,Canada","Computer Science and Music Technology, University of Victoria, Victoria, Canada"],"affiliations":[{"raw_affiliation_string":"Computer Science and Music Technology, University of Victoria,Victoria,Canada","institution_ids":["https://openalex.org/I212119943"]},{"raw_affiliation_string":"Computer Science and Music Technology, University of Victoria, Victoria, Canada","institution_ids":["https://openalex.org/I212119943"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007870362","display_name":"Kirk McNally","orcid":"https://orcid.org/0000-0001-5589-2614"},"institutions":[{"id":"https://openalex.org/I212119943","display_name":"University of Victoria","ror":"https://ror.org/04s5mat29","country_code":"CA","type":"education","lineage":["https://openalex.org/I212119943"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Kirk McNally","raw_affiliation_strings":["Computer Science and Music Technology, University of Victoria,Victoria,Canada","Computer Science and Music Technology, University of Victoria, Victoria, Canada"],"affiliations":[{"raw_affiliation_string":"Computer Science and Music Technology, University of Victoria,Victoria,Canada","institution_ids":["https://openalex.org/I212119943"]},{"raw_affiliation_string":"Computer Science and Music Technology, University of Victoria, Victoria, Canada","institution_ids":["https://openalex.org/I212119943"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5008144020","display_name":"Max Henry","orcid":"https://orcid.org/0000-0003-2981-4000"},"institutions":[{"id":"https://openalex.org/I5023651","display_name":"McGill University","ror":"https://ror.org/01pxwe438","country_code":"CA","type":"education","lineage":["https://openalex.org/I5023651"]},{"id":"https://openalex.org/I4210145168","display_name":"Centre for Interdisciplinary Research in Music Media and Technology","ror":"https://ror.org/03f3kev64","country_code":"CA","type":"facility","lineage":["https://openalex.org/I4210145168"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Max Henry","raw_affiliation_strings":["Music Technology Area McGill University,Montreal,Canada","Music Technology Area McGill University, Montreal, Canada"],"affiliations":[{"raw_affiliation_string":"Music Technology Area McGill University,Montreal,Canada","institution_ids":["https://openalex.org/I4210145168","https://openalex.org/I5023651"]},{"raw_affiliation_string":"Music Technology Area McGill University, Montreal, Canada","institution_ids":["https://openalex.org/I4210145168","https://openalex.org/I5023651"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5072002276"],"corresponding_institution_ids":["https://openalex.org/I4210123192"],"apc_list":null,"apc_paid":null,"fwci":2.4689,"has_fulltext":false,"cited_by_count":18,"citation_normalized_percentile":{"value":0.89770676,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"222","last_page":"229"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8111788630485535},{"id":"https://openalex.org/keywords/timbre","display_name":"Timbre","score":0.714442253112793},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.5581148266792297},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5375762581825256},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.5349987745285034},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.4539657533168793},{"id":"https://openalex.org/keywords/hyperparameter","display_name":"Hyperparameter","score":0.42411544919013977},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.25001996755599976},{"id":"https://openalex.org/keywords/musical","display_name":"Musical","score":0.12132734060287476},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.12113121151924133}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8111788630485535},{"id":"https://openalex.org/C2776539107","wikidata":"https://www.wikidata.org/wiki/Q176501","display_name":"Timbre","level":3,"score":0.714442253112793},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.5581148266792297},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5375762581825256},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.5349987745285034},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.4539657533168793},{"id":"https://openalex.org/C8642999","wikidata":"https://www.wikidata.org/wiki/Q4171168","display_name":"Hyperparameter","level":2,"score":0.42411544919013977},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.25001996755599976},{"id":"https://openalex.org/C558565934","wikidata":"https://www.wikidata.org/wiki/Q2743","display_name":"Musical","level":2,"score":0.12132734060287476},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.12113121151924133},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.23919/dafx51585.2021.9768246","is_oa":false,"landing_page_url":"https://doi.org/10.23919/dafx51585.2021.9768246","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 24th International Conference on Digital Audio Effects (DAFx)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":65,"referenced_works":["https://openalex.org/W1494198834","https://openalex.org/W1556219185","https://openalex.org/W1566660863","https://openalex.org/W1581410183","https://openalex.org/W1986595194","https://openalex.org/W1998446618","https://openalex.org/W2032197604","https://openalex.org/W2109664771","https://openalex.org/W2131676173","https://openalex.org/W2250384498","https://openalex.org/W2593116425","https://openalex.org/W2605102758","https://openalex.org/W2606176153","https://openalex.org/W2791716806","https://openalex.org/W2898148140","https://openalex.org/W2939574508","https://openalex.org/W2949676527","https://openalex.org/W2950547518","https://openalex.org/W2955263139","https://openalex.org/W2964300898","https://openalex.org/W2990440871","https://openalex.org/W2995181338","https://openalex.org/W2995233853","https://openalex.org/W2999531799","https://openalex.org/W3000389243","https://openalex.org/W3005680577","https://openalex.org/W3015338123","https://openalex.org/W3021164770","https://openalex.org/W3030163527","https://openalex.org/W3034978746","https://openalex.org/W3035312337","https://openalex.org/W3047579126","https://openalex.org/W3088942650","https://openalex.org/W3097934054","https://openalex.org/W3103455452","https://openalex.org/W3110955493","https://openalex.org/W3122300013","https://openalex.org/W3135828102","https://openalex.org/W3162391496","https://openalex.org/W3201143670","https://openalex.org/W4205689591","https://openalex.org/W4285367288","https://openalex.org/W4287555654","https://openalex.org/W4287715222","https://openalex.org/W4287757056","https://openalex.org/W4287802874","https://openalex.org/W4292779060","https://openalex.org/W4295910257","https://openalex.org/W6633849734","https://openalex.org/W6634561062","https://openalex.org/W6679739311","https://openalex.org/W6688325169","https://openalex.org/W6736723571","https://openalex.org/W6755182157","https://openalex.org/W6769767169","https://openalex.org/W6771763809","https://openalex.org/W6771812881","https://openalex.org/W6774314701","https://openalex.org/W6776218486","https://openalex.org/W6779191341","https://openalex.org/W6781351833","https://openalex.org/W6783462664","https://openalex.org/W6783536103","https://openalex.org/W6787485125","https://openalex.org/W6788720092"],"related_works":["https://openalex.org/W1984191430","https://openalex.org/W2150711775","https://openalex.org/W2149825536","https://openalex.org/W2108382268","https://openalex.org/W4382202539","https://openalex.org/W4287991268","https://openalex.org/W2995670387","https://openalex.org/W4323339370","https://openalex.org/W2395416690","https://openalex.org/W2109622212"],"abstract_inverted_index":{"We":[0,35],"release":[1,63],"synth1B1,":[2],"a":[3,58,91],"multi-modal":[4],"audio":[5,30,66,86],"corpus":[6],"consisting":[7],"of":[8],"1":[9],"billion":[10],"4-second":[11],"synthesized":[12],"sounds,":[13],"paired":[14],"with":[15],"the":[16,33,46],"synthesis":[17],"parameters":[18],"used":[19],"to":[20,94],"generate":[21],"them.":[22],"The":[23],"dataset":[24,31],"is":[25],"100x":[26],"larger":[27],"than":[28,54],"any":[29],"in":[32],"literature.":[34],"also":[36],"introduce":[37],"torchsynth,":[38],"an":[39],"open":[40],"source":[41],"modular":[42],"synthesizer":[43,95],"that":[44],"generates":[45],"synth":[47,69,73],"1B1":[48],"samples":[49],"on-the-fly":[50],"at":[51],"16200x":[52],"faster":[53],"real-time":[55],"(714MHz)":[56],"on":[57],"single":[59],"GPU.":[60],"Finally,":[61,88],"we":[62,78,89],"two":[64],"new":[65,80],"datasets:":[67],"FM":[68],"timbre":[70],"and":[71],"subtractive":[72],"pitch.":[74],"Using":[75],"these":[76],"datasets,":[77],"demonstrate":[79],"rank-based":[81],"evaluation":[82],"criteria":[83],"for":[84],"existing":[85],"representations.":[87],"propose":[90],"novel":[92],"approach":[93],"hyperparameter":[96],"optimization.":[97]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":7},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":2}],"updated_date":"2026-04-23T09:07:50.710637","created_date":"2025-10-10T00:00:00"}
