{"id":"https://openalex.org/W4412889425","doi":"https://doi.org/10.18653/v1/2025.acl-srw.73","title":"Lost and Found: Computational Quality Assurance of Crowdsourced Knowledge on Morphological Defectivity in Wiktionary","display_name":"Lost and Found: Computational Quality Assurance of Crowdsourced Knowledge on Morphological Defectivity in Wiktionary","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4412889425","doi":"https://doi.org/10.18653/v1/2025.acl-srw.73"},"language":"en","primary_location":{"id":"doi:10.18653/v1/2025.acl-srw.73","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.acl-srw.73","pdf_url":"https://aclanthology.org/2025.acl-srw.73.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 4: Student Research Workshop)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2025.acl-srw.73.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109819791","display_name":"Jonathan Sakunkoo","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Jonathan Sakunkoo","raw_affiliation_strings":["Stanford University OHS"],"affiliations":[{"raw_affiliation_string":"Stanford University OHS","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5109819792","display_name":"Annabella Sakunkoo","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Annabella Sakunkoo","raw_affiliation_strings":["Stanford University OHS"],"affiliations":[{"raw_affiliation_string":"Stanford University OHS","institution_ids":["https://openalex.org/I97018004"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5109819791"],"corresponding_institution_ids":["https://openalex.org/I97018004"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.23020712,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"998","last_page":"1003"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.9301999807357788,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.9301999807357788,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11675","display_name":"Open Source Software Innovations","score":0.9186000227928162,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/quality-assurance","display_name":"Quality assurance","score":0.7319093346595764},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.713369607925415},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5202382802963257},{"id":"https://openalex.org/keywords/knowledge-management","display_name":"Knowledge management","score":0.33436083793640137},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.32130900025367737},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.14660048484802246},{"id":"https://openalex.org/keywords/operations-management","display_name":"Operations management","score":0.05626663565635681}],"concepts":[{"id":"https://openalex.org/C106436119","wikidata":"https://www.wikidata.org/wiki/Q836575","display_name":"Quality assurance","level":3,"score":0.7319093346595764},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.713369607925415},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5202382802963257},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.33436083793640137},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.32130900025367737},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.14660048484802246},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.05626663565635681},{"id":"https://openalex.org/C2778618615","wikidata":"https://www.wikidata.org/wiki/Q4008393","display_name":"External quality assessment","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2025.acl-srw.73","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.acl-srw.73","pdf_url":"https://aclanthology.org/2025.acl-srw.73.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 4: Student Research Workshop)","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2025.acl-srw.73","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2025.acl-srw.73","pdf_url":"https://aclanthology.org/2025.acl-srw.73.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 63rd Annual Meeting of the Association for Computational Linguistics (Volume 4: Student Research Workshop)","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320308380","display_name":"Yale University","ror":"https://ror.org/03v76x132"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4412889425.pdf","grobid_xml":"https://content.openalex.org/works/W4412889425.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Morphological":[0],"defectivity":[1,185],"is":[2,17],"an":[3],"intriguing":[4],"and":[5,46,50,59,90,153,167,180],"understudied":[6],"phenomenon":[7],"in":[8,26,55,186],"linguistics.Addressing":[9],"defectivity,":[10],"where":[11],"expected":[12],"inflectional":[13],"forms":[14],"are":[15,105],"absent,":[16],"essential":[18],"for":[19,150,160,169],"improving":[20],"the":[21,65,93],"accuracy":[22],"of":[23,36,78,99,118,123,133,140,146,172,184],"NLP":[24],"tools":[25,166],"morphologically":[27,188],"rich":[28,189],"languages.However,":[29],"traditional":[30],"linguistic":[31,53,147,162,182],"resources":[32,159],"often":[33,61],"lack":[34],"coverage":[35],"morphological":[37,85,120],"gaps":[38],"as":[39,63,127,143,158],"such":[40],"knowledge":[41,183],"requires":[42],"significant":[43],"human":[44],"expertise":[45],"effort":[47],"to":[48,87],"document":[49],"verify.For":[51],"scarce":[52],"phenomena":[54,152],"under-explored":[56],"languages,":[57,154],"Wikipedia":[58],"Wiktionary":[60,104,112],"serve":[62],"among":[64],"few":[66],"accessible":[67],"resources.Despite":[68],"their":[69,72,156],"extensive":[70],"reach,":[71],"reliability":[73],"has":[74],"been":[75],"a":[76,82,114],"subject":[77],"controversy.This":[79],"study":[80],"customizes":[81],"novel":[83],"neural":[84],"analyzer":[86],"annotate":[88],"Latin":[89,124],"Italian":[91,119],"corpora.Using":[92],"massive":[94],"annotated":[95],"data,":[96,174],"crowd-sourced":[97,141,173],"lists":[98],"defective":[100,128],"verbs":[101],"compiled":[102],"from":[103],"validated":[106],"computationally.Our":[107],"results":[108],"indicate":[109],"that":[110],"while":[111],"provides":[113],"highly":[115],"reliable":[116],"account":[117],"gaps,":[121],"7%":[122],"lemmata":[125],"listed":[126],"show":[129],"strong":[130],"corpus":[131],"evidence":[132],"being":[134],"non-defective.This":[135],"discrepancy":[136],"highlights":[137],"potential":[138],"limitations":[139],"wikis":[142],"definitive":[144],"sources":[145],"knowledge,":[148],"particularly":[149],"less-studied":[151],"despite":[155],"value":[157],"rare":[161],"features.By":[163],"providing":[164],"scalable":[165],"methods":[168],"quality":[170],"assurance":[171],"this":[175],"work":[176],"advances":[177],"computational":[178],"morphology":[179],"expands":[181],"non-English,":[187],"languages.":[190]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
