{"id":"https://openalex.org/W4211190719","doi":"https://doi.org/10.1162/coli_a_00387","title":"Sparse Transcription","display_name":"Sparse Transcription","publication_year":2020,"publication_date":"2020-10-20","ids":{"openalex":"https://openalex.org/W4211190719","doi":"https://doi.org/10.1162/coli_a_00387"},"language":"en","primary_location":{"id":"doi:10.1162/coli_a_00387","is_oa":true,"landing_page_url":"https://doi.org/10.1162/coli_a_00387","pdf_url":"https://direct.mit.edu/coli/article-pdf/46/4/713/1992567/coli_a_00387.pdf","source":{"id":"https://openalex.org/S155526855","display_name":"Computational Linguistics","issn_l":"0891-2017","issn":["0891-2017","1530-9312"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational Linguistics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://direct.mit.edu/coli/article-pdf/46/4/713/1992567/coli_a_00387.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026383657","display_name":"Steven Bird","orcid":"https://orcid.org/0000-0003-3782-7733"},"institutions":[{"id":"https://openalex.org/I29894533","display_name":"Charles Darwin University","ror":"https://ror.org/048zcaj52","country_code":"AU","type":"education","lineage":["https://openalex.org/I29894533"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Steven Bird","raw_affiliation_strings":["Northern Institute, Charles Darwin University. steven.bird@cdu.edu.au"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Northern Institute, Charles Darwin University. steven.bird@cdu.edu.au","institution_ids":["https://openalex.org/I29894533"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5026383657"],"corresponding_institution_ids":["https://openalex.org/I29894533"],"apc_list":null,"apc_paid":null,"fwci":1.2241,"has_fulltext":true,"cited_by_count":17,"citation_normalized_percentile":{"value":0.84808357,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"46","issue":"4","first_page":"713","last_page":"744"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12090","display_name":"Language and cultural evolution","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/3316","display_name":"Cultural Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8121348023414612},{"id":"https://openalex.org/keywords/transcription","display_name":"Transcription (linguistics)","score":0.7984753847122192},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.5077980160713196},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.48297563195228577},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.463541716337204},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.43664902448654175},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4236016869544983},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.20394307374954224}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8121348023414612},{"id":"https://openalex.org/C179926584","wikidata":"https://www.wikidata.org/wiki/Q207714","display_name":"Transcription (linguistics)","level":2,"score":0.7984753847122192},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.5077980160713196},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.48297563195228577},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.463541716337204},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43664902448654175},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4236016869544983},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.20394307374954224},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1162/coli_a_00387","is_oa":true,"landing_page_url":"https://doi.org/10.1162/coli_a_00387","pdf_url":"https://direct.mit.edu/coli/article-pdf/46/4/713/1992567/coli_a_00387.pdf","source":{"id":"https://openalex.org/S155526855","display_name":"Computational Linguistics","issn_l":"0891-2017","issn":["0891-2017","1530-9312"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational Linguistics","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:b6267cfbce52417fb4dd40fe90e030c6","is_oa":false,"landing_page_url":"https://doaj.org/article/b6267cfbce52417fb4dd40fe90e030c6","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Computational Linguistics, Vol 46, Iss 4, Pp 713-744 (2021)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1162/coli_a_00387","is_oa":true,"landing_page_url":"https://doi.org/10.1162/coli_a_00387","pdf_url":"https://direct.mit.edu/coli/article-pdf/46/4/713/1992567/coli_a_00387.pdf","source":{"id":"https://openalex.org/S155526855","display_name":"Computational Linguistics","issn_l":"0891-2017","issn":["0891-2017","1530-9312"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational Linguistics","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.8299999833106995,"display_name":"Quality Education"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320320993","display_name":"Charles Darwin University","ror":"https://ror.org/048zcaj52"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4211190719.pdf","grobid_xml":"https://content.openalex.org/works/W4211190719.grobid-xml"},"referenced_works_count":67,"referenced_works":["https://openalex.org/W30845872","https://openalex.org/W238053788","https://openalex.org/W785359481","https://openalex.org/W956880141","https://openalex.org/W1486364748","https://openalex.org/W1524956127","https://openalex.org/W1546890408","https://openalex.org/W1591914803","https://openalex.org/W1885617648","https://openalex.org/W1898789533","https://openalex.org/W1983888999","https://openalex.org/W1990856848","https://openalex.org/W1991303455","https://openalex.org/W2014840417","https://openalex.org/W2043199434","https://openalex.org/W2043502271","https://openalex.org/W2064699871","https://openalex.org/W2088615611","https://openalex.org/W2101105183","https://openalex.org/W2101281673","https://openalex.org/W2103147879","https://openalex.org/W2114347655","https://openalex.org/W2122228338","https://openalex.org/W2126377586","https://openalex.org/W2126449874","https://openalex.org/W2146204822","https://openalex.org/W2159625327","https://openalex.org/W2166270474","https://openalex.org/W2183100634","https://openalex.org/W2251408482","https://openalex.org/W2277634955","https://openalex.org/W2318423094","https://openalex.org/W2402112460","https://openalex.org/W2466129686","https://openalex.org/W2466918907","https://openalex.org/W2501891305","https://openalex.org/W2507826679","https://openalex.org/W2513832136","https://openalex.org/W2515167330","https://openalex.org/W2545319977","https://openalex.org/W2563850823","https://openalex.org/W2593011301","https://openalex.org/W2605131327","https://openalex.org/W2756675017","https://openalex.org/W2808682925","https://openalex.org/W2884066185","https://openalex.org/W2895097770","https://openalex.org/W2897388834","https://openalex.org/W2899134946","https://openalex.org/W2905961459","https://openalex.org/W2949410830","https://openalex.org/W2963378435","https://openalex.org/W2963620343","https://openalex.org/W2963767893","https://openalex.org/W2963819008","https://openalex.org/W2964102148","https://openalex.org/W2965383430","https://openalex.org/W2966864296","https://openalex.org/W2987701772","https://openalex.org/W3112849432","https://openalex.org/W4239270640","https://openalex.org/W4244337760","https://openalex.org/W4247270039","https://openalex.org/W4388122691","https://openalex.org/W6647171314","https://openalex.org/W6889619760","https://openalex.org/W6889634863"],"related_works":["https://openalex.org/W2374412966","https://openalex.org/W2357325779","https://openalex.org/W2357461155","https://openalex.org/W3107474891","https://openalex.org/W1978971213","https://openalex.org/W159132833","https://openalex.org/W1567338489","https://openalex.org/W38394648","https://openalex.org/W1517743118","https://openalex.org/W2322902172"],"abstract_inverted_index":{"Abstract":[0],"The":[1],"transcription":[2,85,128,135],"bottleneck":[3],"is":[4,27],"often":[5],"cited":[6],"as":[7],"a":[8,57,76,82,88,96,111],"major":[9],"obstacle":[10],"for":[11,156],"efforts":[12],"to":[13,28,41,145,153],"document":[14],"the":[15,61,130,151],"world\u2019s":[16],"endangered":[17],"languages":[18],"and":[19,35,38,46,64,87,123,139,148],"supply":[20],"them":[21],"with":[22,60,67,136],"language":[23],"technologies.":[24],"One":[25],"solution":[26],"extend":[29],"methods":[30,155],"from":[31,114],"automatic":[32],"speech":[33],"recognition":[34],"machine":[36],"translation,":[37],"recruit":[39],"linguists":[40],"provide":[42],"narrow":[43],"phonetic":[44],"transcriptions":[45],"sentence-aligned":[47],"translations.":[48],"However,":[49],"I":[50,80,105],"believe":[51],"that":[52,70,104,117,142,149],"these":[53],"approaches":[54],"are":[55,71,143],"not":[56],"good":[58],"fit":[59],"available":[62],"data":[63],"skills,":[65],"or":[66],"long-established":[68],"practices":[69],"essentially":[72],"word-based.":[73],"In":[74],"seeking":[75],"more":[77],"effective":[78],"approach,":[79],"consider":[81],"century":[83],"of":[84,91,133],"practice":[86,132],"wide":[89],"range":[90],"computational":[92,97],"approaches,":[93],"before":[94],"proposing":[95],"model":[98],"based":[99],"on":[100],"spoken":[101],"term":[102],"detection":[103],"call":[106],"\u201csparse":[107],"transcription.\u201d":[108],"This":[109],"represents":[110],"shift":[112],"away":[113],"current":[115],"assumptions":[116],"we":[118],"transcribe":[119,121,124],"phones,":[120],"fully,":[122],"first.":[125],"Instead,":[126],"sparse":[127],"combines":[129],"older":[131],"word-level":[134],"interpretive,":[137],"iterative,":[138],"interactive":[140],"processes":[141],"amenable":[144],"wider":[146],"participation":[147],"open":[150],"way":[152],"new":[154],"processing":[157],"oral":[158],"languages.":[159]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":2}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
