{"id":"https://openalex.org/W7092291090","doi":"https://doi.org/10.48550/arxiv.2510.13871","title":"Quechua Speech Datasets in Common Voice: The Case of Puno Quechua","display_name":"Quechua Speech Datasets in Common Voice: The Case of Puno Quechua","publication_year":2025,"publication_date":"2025-10-13","ids":{"openalex":"https://openalex.org/W7092291090","doi":"https://doi.org/10.48550/arxiv.2510.13871"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2510.13871","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.13871","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2510.13871","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Huaman, Elwin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huaman, Elwin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Huaman, Wendi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huaman, Wendi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Huaman, Jorge Luis","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huaman, Jorge Luis","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Quispe, Ninfa","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Quispe, Ninfa","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T13194","display_name":"ICT in Developing Communities","score":0.8420000076293945,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13194","display_name":"ICT in Developing Communities","score":0.8420000076293945,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13996","display_name":"Diverse Musicological Studies","score":0.01489999983459711,"subfield":{"id":"https://openalex.org/subfields/1210","display_name":"Music"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.010999999940395355,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/indigenous","display_name":"Indigenous","score":0.6855999827384949},{"id":"https://openalex.org/keywords/empowerment","display_name":"Empowerment","score":0.4214000105857849},{"id":"https://openalex.org/keywords/reading","display_name":"Reading (process)","score":0.4088999927043915},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.3903000056743622},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.37059998512268066}],"concepts":[{"id":"https://openalex.org/C55958113","wikidata":"https://www.wikidata.org/wiki/Q169480","display_name":"Indigenous","level":2,"score":0.6855999827384949},{"id":"https://openalex.org/C20555606","wikidata":"https://www.wikidata.org/wiki/Q868575","display_name":"Empowerment","level":2,"score":0.4214000105857849},{"id":"https://openalex.org/C554936623","wikidata":"https://www.wikidata.org/wiki/Q199657","display_name":"Reading (process)","level":2,"score":0.4088999927043915},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.3903000056743622},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.37059998512268066},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.34549999237060547},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.3212999999523163},{"id":"https://openalex.org/C2781370049","wikidata":"https://www.wikidata.org/wiki/Q645304","display_name":"Indigenous language","level":3,"score":0.3203999996185303},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.3005000054836273},{"id":"https://openalex.org/C2549261","wikidata":"https://www.wikidata.org/wiki/Q43455","display_name":"Ethnology","level":1,"score":0.2856000065803528},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.2623000144958496}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2510.13871","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.13871","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2510.13871","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.13871","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.7208861708641052}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Under-resourced":[0],"languages,":[1,52],"such":[2],"as":[3,59],"Quechuas,":[4],"face":[5],"data":[6,123],"and":[7,30,68,74,121,132],"resource":[8],"scarcity,":[9],"hindering":[10],"their":[11],"development":[12],"in":[13],"speech":[14,32,76,90],"technology.":[15],"To":[16],"address":[17],"this":[18],"issue,":[19],"Common":[20,44,82,103],"Voice":[21,83],"presents":[22],"a":[23,60,109],"crucial":[24],"opportunity":[25],"to":[26],"foster":[27],"an":[28],"open":[29],"community-driven":[31],"dataset":[33],"creation.":[34],"This":[35],"paper":[36],"examines":[37],"the":[38,48,102],"integration":[39],"of":[40,71,88,135],"Quechua":[41,51,55,89,95],"languages":[42],"into":[43],"Voice.":[45],"We":[46,106],"detail":[47],"current":[49],"17":[50],"presenting":[53],"Puno":[54,94],"(ISO":[56],"639-3:":[57],"qxp)":[58],"focused":[61],"case":[62],"study":[63],"that":[64,81],"includes":[65],"language":[66,137],"onboarding":[67],"corpus":[69],"collection":[70],"both":[72],"reading":[73],"spontaneous":[75],"data.":[77],"Our":[78,125],"results":[79],"demonstrate":[80],"now":[84],"hosts":[85],"191.1":[86],"hours":[87,98],"(86\\%":[91],"validated),":[92,100],"with":[93],"contributing":[96],"12":[97],"(77\\%":[99],"highlighting":[101],"Voice's":[104],"potential.":[105],"further":[107],"propose":[108],"research":[110],"agenda":[111],"addressing":[112],"technical":[113],"challenges,":[114],"alongside":[115],"ethical":[116],"considerations":[117],"for":[118],"community":[119],"engagement":[120],"indigenous":[122],"sovereignty.":[124],"work":[126],"contributes":[127],"towards":[128],"inclusive":[129],"voice":[130],"technology":[131],"digital":[133],"empowerment":[134],"under-resourced":[136],"communities.":[138]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-18T00:00:00"}
