{"id":"https://openalex.org/W2280950113","doi":"https://doi.org/10.1186/s13636-016-0081-1","title":"Grid-based approximation for voice conversion in low resource environments","display_name":"Grid-based approximation for voice conversion in low resource environments","publication_year":2016,"publication_date":"2016-01-21","ids":{"openalex":"https://openalex.org/W2280950113","doi":"https://doi.org/10.1186/s13636-016-0081-1","mag":"2280950113"},"language":"en","primary_location":{"id":"doi:10.1186/s13636-016-0081-1","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13636-016-0081-1","pdf_url":"https://asmp-eurasipjournals.springeropen.com/track/pdf/10.1186/s13636-016-0081-1","source":{"id":"https://openalex.org/S19605986","display_name":"EURASIP Journal on Audio Speech and Music Processing","issn_l":"1687-4714","issn":["1687-4714","1687-4722"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://asmp-eurasipjournals.springeropen.com/track/pdf/10.1186/s13636-016-0081-1","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5029174249","display_name":"Hadas Benisty","orcid":"https://orcid.org/0000-0001-6308-2267"},"institutions":[{"id":"https://openalex.org/I174306211","display_name":"Technion \u2013 Israel Institute of Technology","ror":"https://ror.org/03qryx823","country_code":"IL","type":"education","lineage":["https://openalex.org/I174306211"]}],"countries":["IL"],"is_corresponding":true,"raw_author_name":"Hadas Benisty","raw_affiliation_strings":["Electrical Engineering Department, Technion\u2013Israel Institute of Technology, Technion City, Haifa, Israel"],"affiliations":[{"raw_affiliation_string":"Electrical Engineering Department, Technion\u2013Israel Institute of Technology, Technion City, Haifa, Israel","institution_ids":["https://openalex.org/I174306211"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009813683","display_name":"D. Malah","orcid":"https://orcid.org/0009-0001-8310-7844"},"institutions":[{"id":"https://openalex.org/I174306211","display_name":"Technion \u2013 Israel Institute of Technology","ror":"https://ror.org/03qryx823","country_code":"IL","type":"education","lineage":["https://openalex.org/I174306211"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"David Malah","raw_affiliation_strings":["Electrical Engineering Department, Technion\u2013Israel Institute of Technology, Technion City, Haifa, Israel"],"affiliations":[{"raw_affiliation_string":"Electrical Engineering Department, Technion\u2013Israel Institute of Technology, Technion City, Haifa, Israel","institution_ids":["https://openalex.org/I174306211"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5006419939","display_name":"Koby Crammer","orcid":"https://orcid.org/0000-0001-8824-5747"},"institutions":[{"id":"https://openalex.org/I174306211","display_name":"Technion \u2013 Israel Institute of Technology","ror":"https://ror.org/03qryx823","country_code":"IL","type":"education","lineage":["https://openalex.org/I174306211"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Koby Crammer","raw_affiliation_strings":["Electrical Engineering Department, Technion\u2013Israel Institute of Technology, Technion City, Haifa, Israel"],"affiliations":[{"raw_affiliation_string":"Electrical Engineering Department, Technion\u2013Israel Institute of Technology, Technion City, Haifa, Israel","institution_ids":["https://openalex.org/I174306211"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5029174249"],"corresponding_institution_ids":["https://openalex.org/I174306211"],"apc_list":{"value":1115,"currency":"GBP","value_usd":1367},"apc_paid":{"value":1115,"currency":"GBP","value_usd":1367},"fwci":0.5044,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.61450518,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"2016","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9891999959945679,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8127325177192688},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6477912664413452},{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.6031616926193237},{"id":"https://openalex.org/keywords/cepstrum","display_name":"Cepstrum","score":0.5516730546951294},{"id":"https://openalex.org/keywords/smoothing","display_name":"Smoothing","score":0.5475212335586548},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4508098363876343},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37028968334198},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.36778879165649414},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.32012826204299927},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.13932079076766968},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.1174885630607605}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8127325177192688},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6477912664413452},{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.6031616926193237},{"id":"https://openalex.org/C88485024","wikidata":"https://www.wikidata.org/wiki/Q1054571","display_name":"Cepstrum","level":2,"score":0.5516730546951294},{"id":"https://openalex.org/C3770464","wikidata":"https://www.wikidata.org/wiki/Q775963","display_name":"Smoothing","level":2,"score":0.5475212335586548},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4508098363876343},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37028968334198},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.36778879165649414},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.32012826204299927},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.13932079076766968},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.1174885630607605},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1186/s13636-016-0081-1","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13636-016-0081-1","pdf_url":"https://asmp-eurasipjournals.springeropen.com/track/pdf/10.1186/s13636-016-0081-1","source":{"id":"https://openalex.org/S19605986","display_name":"EURASIP Journal on Audio Speech and Music Processing","issn_l":"1687-4714","issn":["1687-4714","1687-4722"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1186/s13636-016-0081-1","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13636-016-0081-1","pdf_url":"https://asmp-eurasipjournals.springeropen.com/track/pdf/10.1186/s13636-016-0081-1","source":{"id":"https://openalex.org/S19605986","display_name":"EURASIP Journal on Audio Speech and Music Processing","issn_l":"1687-4714","issn":["1687-4714","1687-4722"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/8","display_name":"Decent work and economic growth","score":0.4099999964237213}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2280950113.pdf","grobid_xml":"https://content.openalex.org/works/W2280950113.grobid-xml"},"referenced_works_count":31,"referenced_works":["https://openalex.org/W142801778","https://openalex.org/W190419602","https://openalex.org/W1491561031","https://openalex.org/W1526513105","https://openalex.org/W1588266896","https://openalex.org/W1970763740","https://openalex.org/W1977362459","https://openalex.org/W1997282645","https://openalex.org/W2011916518","https://openalex.org/W2032130465","https://openalex.org/W2045026634","https://openalex.org/W2049633694","https://openalex.org/W2114659828","https://openalex.org/W2120605154","https://openalex.org/W2121387787","https://openalex.org/W2123003832","https://openalex.org/W2135869853","https://openalex.org/W2136166660","https://openalex.org/W2145130307","https://openalex.org/W2156142001","https://openalex.org/W2156477760","https://openalex.org/W2160337655","https://openalex.org/W2161476805","https://openalex.org/W2227610995","https://openalex.org/W2293807537","https://openalex.org/W2295406225","https://openalex.org/W2406654659","https://openalex.org/W2408732577","https://openalex.org/W2943553228","https://openalex.org/W6601579809","https://openalex.org/W6601724703"],"related_works":["https://openalex.org/W2018086531","https://openalex.org/W1980297060","https://openalex.org/W2939490483","https://openalex.org/W2387604097","https://openalex.org/W2787035864","https://openalex.org/W2373675101","https://openalex.org/W2038216521","https://openalex.org/W4385672897","https://openalex.org/W2736574136","https://openalex.org/W1996938627"],"abstract_inverted_index":{"The":[0,152,184,208],"goal":[1],"of":[2,39,53,71,84,105,173,199,214,228,244,275,291,325],"voice":[3],"conversion":[4,22,136,164,294],"is":[5,119,144,155,166,222],"to":[6,12,33,55,62,68,121,239,266,273,279,288,313],"modify":[7],"a":[8,18,111,115,169,196,326],"source":[9,41,182],"speaker\u2019s":[10],"speech":[11],"sound":[13],"as":[14,114,168,205,310],"if":[15],"spoken":[16],"by":[17,161,249,303],"target":[19,43,176,201,277,315],"speaker.":[20],"Common":[21],"methods":[23],"are":[24,77,192,308],"based":[25,156,178],"on":[26,157,179],"Gaussian":[27],"mixture":[28],"modeling":[29],"(GMM).":[30],"They":[31],"aim":[32],"statistically":[34],"model":[35],"the":[36,40,72,103,133,163,175,180,200,218,241,245,250,253,276,284,292,304,314,318,323,330],"spectral":[37,73,281],"structure":[38],"and":[42,45,89,96,221,252,278],"signals":[44,247,301],"require":[46],"relatively":[47],"large":[48],"training":[49,85,107,202,209,219,231,259],"sets":[50],"(typically":[51],"dozens":[52],"sentences)":[54],"avoid":[56],"over-fitting.":[57],"Moreover,":[58],"they":[59],"often":[60],"lead":[61],"muffled":[63],"synthesized":[64,246],"output":[65],"signals,":[66,321],"due":[67],"excessive":[69],"smoothing":[70],"envelopes.":[74],"Mobile":[75],"applications":[76],"characterized":[78],"with":[79],"low":[80,140],"resources":[81],"in":[82,226,329],"terms":[83],"data,":[86],"memory":[87,97],"footprint,":[88],"computational":[90,95],"complexity.":[91],"As":[92],"technology":[93],"advances,":[94],"requirements":[98],"become":[99],"less":[100],"limiting;":[101],"however,":[102],"amount":[104],"available":[106],"data":[108],"still":[109],"presents":[110],"great":[112],"challenge,":[113],"typical":[116],"mobile":[117],"user":[118],"willing":[120],"record":[122],"himself":[123],"saying":[124],"just":[125,257],"few":[126,149],"sentences.":[127],"In":[128],"this":[129],"paper,":[130],"we":[131],"propose":[132],"grid-based":[134],"(GB)":[135],"method":[137,264,307],"for":[138],"such":[139],"resource":[141],"environments,":[142],"which":[143,162],"successfully":[145],"trained":[146],"using":[147,195],"very":[148,229],"sentences":[150,268],"(5\u201310).":[151],"GB":[153,263,306],"approach":[154],"sequential":[158,170],"Bayesian":[159],"tracking,":[160],"process":[165,210],"expressed":[167],"estimation":[171],"problem":[172],"tracking":[174],"spectrum":[177],"observed":[181],"spectrum.":[183],"converted":[185,267],"Mel":[186],"frequency":[187],"cepstrum":[188],"coefficient":[189],"(MFCC)":[190],"vectors":[191,203,220],"sequentially":[193],"evaluated":[194],"weighted":[197],"sum":[198],"used":[204],"grid":[206],"points.":[207],"includes":[211],"simple":[212],"computations":[213],"Euclidian":[215],"distances":[216,282],"between":[217],"easily":[223],"performed":[224],"even":[225],"cases":[227],"small":[230,327],"sets.":[232],"We":[233],"use":[234],"global":[235],"variance":[236],"(GV)":[237],"enhancement":[238],"improve":[240],"perceived":[242,309,331],"quality":[243],"obtained":[248],"proposed":[251],"GMM-based":[254,293],"methods.":[255],"Using":[256],"10":[258],"sentences,":[260],"our":[261],"enhanced":[262,289,305,319],"leads":[265],"having":[269],"closer":[270],"GV":[271],"values":[272],"those":[274],"lower":[280],"at":[283,322],"same":[285],"time,":[286],"compared":[287],"version":[290],"method.":[295],"Furthermore,":[296],"subjective":[297],"evaluations":[298],"show":[299],"that":[300],"produced":[302],"more":[311],"similar":[312],"speaker":[316],"than":[317],"GMM":[320],"expense":[324],"degradation":[328],"quality.":[332]},"counts_by_year":[{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
