{"id":"https://openalex.org/W3006926732","doi":"https://doi.org/10.21437/interspeech.2020-1242","title":"Towards Learning a Universal Non-Semantic Representation of Speech","display_name":"Towards Learning a Universal Non-Semantic Representation of Speech","publication_year":2020,"publication_date":"2020-10-25","ids":{"openalex":"https://openalex.org/W3006926732","doi":"https://doi.org/10.21437/interspeech.2020-1242","mag":"3006926732"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2020-1242","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2020-1242","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2020","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2002.12764","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5076659859","display_name":"Joel Shor","orcid":"https://orcid.org/0000-0002-6729-5988"},"institutions":[{"id":"https://openalex.org/I4210117425","display_name":"Google (Israel)","ror":"https://ror.org/02c20ys54","country_code":"IL","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210117425","https://openalex.org/I4210128969"]}],"countries":["IL"],"is_corresponding":true,"raw_author_name":"Joel Shor","raw_affiliation_strings":["Google Research, Israel"],"affiliations":[{"raw_affiliation_string":"Google Research, Israel","institution_ids":["https://openalex.org/I4210117425"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103622427","display_name":"Aren Jansen","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Aren Jansen","raw_affiliation_strings":["Google Research, Mountain View"],"affiliations":[{"raw_affiliation_string":"Google Research, Mountain View","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058036083","display_name":"Ronnie Maor","orcid":null},"institutions":[{"id":"https://openalex.org/I4210117425","display_name":"Google (Israel)","ror":"https://ror.org/02c20ys54","country_code":"IL","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210117425","https://openalex.org/I4210128969"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Ronnie Maor","raw_affiliation_strings":["Google Research, Israel"],"affiliations":[{"raw_affiliation_string":"Google Research, Israel","institution_ids":["https://openalex.org/I4210117425"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035078692","display_name":"Oran Lang","orcid":"https://orcid.org/0000-0001-7644-8459"},"institutions":[{"id":"https://openalex.org/I4210117425","display_name":"Google (Israel)","ror":"https://ror.org/02c20ys54","country_code":"IL","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210117425","https://openalex.org/I4210128969"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Oran Lang","raw_affiliation_strings":["Google Research, Israel"],"affiliations":[{"raw_affiliation_string":"Google Research, Israel","institution_ids":["https://openalex.org/I4210117425"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005400175","display_name":"Omry Tuval","orcid":null},"institutions":[{"id":"https://openalex.org/I4210117425","display_name":"Google (Israel)","ror":"https://ror.org/02c20ys54","country_code":"IL","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210117425","https://openalex.org/I4210128969"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Omry Tuval","raw_affiliation_strings":["Google Research, Israel"],"affiliations":[{"raw_affiliation_string":"Google Research, Israel","institution_ids":["https://openalex.org/I4210117425"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026916144","display_name":"F\u00e9lix de Chaumont Quitry","orcid":"https://orcid.org/0000-0003-4959-0016"},"institutions":[{"id":"https://openalex.org/I4210100430","display_name":"Google (Switzerland)","ror":"https://ror.org/014f9c269","country_code":"CH","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210100430","https://openalex.org/I4210128969"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"F\u00e9lix de Chaumont Quitry","raw_affiliation_strings":["Google Research, Zurich"],"affiliations":[{"raw_affiliation_string":"Google Research, Zurich","institution_ids":["https://openalex.org/I4210100430"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033341878","display_name":"Marco Tagliasacchi","orcid":"https://orcid.org/0000-0002-7682-6795"},"institutions":[{"id":"https://openalex.org/I4210100430","display_name":"Google (Switzerland)","ror":"https://ror.org/014f9c269","country_code":"CH","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210100430","https://openalex.org/I4210128969"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Marco Tagliasacchi","raw_affiliation_strings":["Google Research, Zurich"],"affiliations":[{"raw_affiliation_string":"Google Research, Zurich","institution_ids":["https://openalex.org/I4210100430"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081284206","display_name":"Ira Shavitt","orcid":null},"institutions":[{"id":"https://openalex.org/I4210117425","display_name":"Google (Israel)","ror":"https://ror.org/02c20ys54","country_code":"IL","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210117425","https://openalex.org/I4210128969"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Ira Shavitt","raw_affiliation_strings":["Google Research, Israel"],"affiliations":[{"raw_affiliation_string":"Google Research, Israel","institution_ids":["https://openalex.org/I4210117425"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069735438","display_name":"Dotan Emanuel","orcid":null},"institutions":[{"id":"https://openalex.org/I4210117425","display_name":"Google (Israel)","ror":"https://ror.org/02c20ys54","country_code":"IL","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210117425","https://openalex.org/I4210128969"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Dotan Emanuel","raw_affiliation_strings":["Google Research, Israel"],"affiliations":[{"raw_affiliation_string":"Google Research, Israel","institution_ids":["https://openalex.org/I4210117425"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070881595","display_name":"Yinnon Haviv","orcid":null},"institutions":[{"id":"https://openalex.org/I4210117425","display_name":"Google (Israel)","ror":"https://ror.org/02c20ys54","country_code":"IL","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210117425","https://openalex.org/I4210128969"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Yinnon Haviv","raw_affiliation_strings":["Google Research, Israel"],"affiliations":[{"raw_affiliation_string":"Google Research, Israel","institution_ids":["https://openalex.org/I4210117425"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5076659859"],"corresponding_institution_ids":["https://openalex.org/I4210117425"],"apc_list":null,"apc_paid":null,"fwci":12.9343,"has_fulltext":false,"cited_by_count":124,"citation_normalized_percentile":{"value":0.99296417,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"140","last_page":"144"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8603675365447998},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7987403273582458},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.652794361114502},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.6155533194541931},{"id":"https://openalex.org/keywords/personalization","display_name":"Personalization","score":0.6009277701377869},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5778043270111084},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.5759173631668091},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.5406851172447205},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5180408954620361},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5029904246330261},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.49592718482017517},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.4805762767791748},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.46441859006881714},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.4568619728088379}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8603675365447998},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7987403273582458},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.652794361114502},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.6155533194541931},{"id":"https://openalex.org/C183003079","wikidata":"https://www.wikidata.org/wiki/Q1000371","display_name":"Personalization","level":2,"score":0.6009277701377869},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5778043270111084},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.5759173631668091},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.5406851172447205},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5180408954620361},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5029904246330261},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.49592718482017517},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.4805762767791748},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.46441859006881714},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.4568619728088379},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.21437/interspeech.2020-1242","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2020-1242","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2020","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2002.12764","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2002.12764","pdf_url":"https://arxiv.org/pdf/2002.12764","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2002.12764","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2002.12764","pdf_url":"https://arxiv.org/pdf/2002.12764","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"score":0.5199999809265137,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":52,"referenced_works":["https://openalex.org/W105569935","https://openalex.org/W1608367484","https://openalex.org/W2030931454","https://openalex.org/W2085662862","https://openalex.org/W2101234009","https://openalex.org/W2148154194","https://openalex.org/W2149933564","https://openalex.org/W2165698076","https://openalex.org/W2396589722","https://openalex.org/W2513507089","https://openalex.org/W2526050071","https://openalex.org/W2593116425","https://openalex.org/W2612445135","https://openalex.org/W2620629206","https://openalex.org/W2726515241","https://openalex.org/W2767754137","https://openalex.org/W2772935161","https://openalex.org/W2773070064","https://openalex.org/W2797583228","https://openalex.org/W2842511635","https://openalex.org/W2887280559","https://openalex.org/W2923014074","https://openalex.org/W2941715400","https://openalex.org/W2944200841","https://openalex.org/W2950007391","https://openalex.org/W2951828005","https://openalex.org/W2952558884","https://openalex.org/W2953360861","https://openalex.org/W2962839749","https://openalex.org/W2963087613","https://openalex.org/W2963194800","https://openalex.org/W2963300719","https://openalex.org/W2963310665","https://openalex.org/W2964013315","https://openalex.org/W2964317695","https://openalex.org/W2972943112","https://openalex.org/W2973157397","https://openalex.org/W2977259558","https://openalex.org/W2980287048","https://openalex.org/W2984843443","https://openalex.org/W2994728585","https://openalex.org/W2995254904","https://openalex.org/W2996158613","https://openalex.org/W2998249245","https://openalex.org/W3016011332","https://openalex.org/W3094550259","https://openalex.org/W3099206234","https://openalex.org/W3108131700","https://openalex.org/W4297775537","https://openalex.org/W4297808394","https://openalex.org/W4299518610","https://openalex.org/W4394655213"],"related_works":["https://openalex.org/W2378211422","https://openalex.org/W2745001401","https://openalex.org/W4321353415","https://openalex.org/W2130974462","https://openalex.org/W2028665553","https://openalex.org/W2086519370","https://openalex.org/W972276598","https://openalex.org/W2087343574","https://openalex.org/W2440023763","https://openalex.org/W2962474440"],"abstract_inverted_index":{"The":[0,24,66,87,113],"ultimate":[1],"goal":[2],"of":[3,83,103],"transfer":[4,84],"learning":[5,85],"is":[6,89,98],"to":[7,32,41],"reduce":[8],"labeled":[9],"data":[10],"requirements":[11],"by":[12],"exploiting":[13],"a":[14,47,58,81,92,101],"pre-existing":[15],"embedding":[16,88],"model":[17],"trained":[18,90],"for":[19,49],"different":[20],"datasets":[21],"or":[22],"tasks.":[23,86],"visual":[25],"and":[26,56,75,96,110,116],"language":[27],"communities":[28],"have":[29],"established":[30],"benchmarks":[31],"compare":[33],"embeddings,":[34],"but":[35],"the":[36,73],"speech":[37,51],"community":[38],"has":[39],"yet":[40],"do":[42],"so.":[43],"This":[44],"paper":[45],"proposes":[46,57],"benchmark":[48],"comparing":[50],"representations":[52,71],"on":[53,61,72,80,91,100],"non-semantic":[54],"tasks,":[55,106],"representation":[59,68],"based":[60],"an":[62],"unsupervised":[63],"triplet-loss":[64],"objective.":[65],"proposed":[67],"outperforms":[69],"other":[70],"benchmark,":[74,114],"even":[76],"exceeds":[77],"state-of-the-art":[78],"performance":[79],"number":[82],"publicly":[93,120],"available":[94],"dataset,":[95],"it":[97],"tested":[99],"variety":[102],"low-resource":[104],"downstream":[105],"including":[107],"personalization":[108],"tasks":[109],"medical":[111],"domain.":[112],"models,":[115],"evaluation":[117],"code":[118],"are":[119],"released.":[121]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":12},{"year":2024,"cited_by_count":23},{"year":2023,"cited_by_count":33},{"year":2022,"cited_by_count":32},{"year":2021,"cited_by_count":19},{"year":2020,"cited_by_count":1}],"updated_date":"2026-04-13T07:58:08.660418","created_date":"2025-10-10T00:00:00"}
