{"id":"https://openalex.org/W3117249014","doi":"https://doi.org/10.18653/v1/2020.coling-main.163","title":"Detecting de minimis Code-Switching in Historical German Books","display_name":"Detecting de minimis Code-Switching in Historical German Books","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3117249014","doi":"https://doi.org/10.18653/v1/2020.coling-main.163","mag":"3117249014"},"language":"en","primary_location":{"id":"doi:10.18653/v1/2020.coling-main.163","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2020.coling-main.163","pdf_url":"https://www.aclweb.org/anthology/2020.coling-main.163.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th International Conference on Computational Linguistics","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/2020.coling-main.163.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5052558807","display_name":"Shijia Liu","orcid":"https://orcid.org/0000-0001-6634-4808"},"institutions":[{"id":"https://openalex.org/I12912129","display_name":"Northeastern University","ror":"https://ror.org/04t5xt781","country_code":"US","type":"education","lineage":["https://openalex.org/I12912129"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Shijia Liu","raw_affiliation_strings":["College of Computer Sciences Northeastern University"],"affiliations":[{"raw_affiliation_string":"College of Computer Sciences Northeastern University","institution_ids":["https://openalex.org/I12912129"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101722493","display_name":"David A. Smith","orcid":"https://orcid.org/0000-0002-6636-6940"},"institutions":[{"id":"https://openalex.org/I12912129","display_name":"Northeastern University","ror":"https://ror.org/04t5xt781","country_code":"US","type":"education","lineage":["https://openalex.org/I12912129"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"David Smith","raw_affiliation_strings":["College of Computer Sciences Northeastern University"],"affiliations":[{"raw_affiliation_string":"College of Computer Sciences Northeastern University","institution_ids":["https://openalex.org/I12912129"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5052558807"],"corresponding_institution_ids":["https://openalex.org/I12912129"],"apc_list":null,"apc_paid":null,"fwci":0.2651,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.65078308,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1808","last_page":"1814"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11640","display_name":"Linguistic Variation and Morphology","score":0.9750999808311462,"subfield":{"id":"https://openalex.org/subfields/3310","display_name":"Linguistics and Language"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/code-switching","display_name":"Code-switching","score":0.8837541341781616},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8477755784988403},{"id":"https://openalex.org/keywords/german","display_name":"German","score":0.81890469789505},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5933485627174377},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.552684485912323},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5440995693206787},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.49578604102134705},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3435537815093994},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.27978333830833435},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.23027122020721436}],"concepts":[{"id":"https://openalex.org/C18552078","wikidata":"https://www.wikidata.org/wiki/Q255615","display_name":"Code-switching","level":2,"score":0.8837541341781616},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8477755784988403},{"id":"https://openalex.org/C154775046","wikidata":"https://www.wikidata.org/wiki/Q188","display_name":"German","level":2,"score":0.81890469789505},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5933485627174377},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.552684485912323},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5440995693206787},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.49578604102134705},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3435537815093994},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.27978333830833435},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.23027122020721436},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2020.coling-main.163","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2020.coling-main.163","pdf_url":"https://www.aclweb.org/anthology/2020.coling-main.163.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th International Conference on Computational Linguistics","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2020.coling-main.163","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2020.coling-main.163","pdf_url":"https://www.aclweb.org/anthology/2020.coling-main.163.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 28th International Conference on Computational Linguistics","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.8100000023841858,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3117249014.pdf","grobid_xml":"https://content.openalex.org/works/W3117249014.grobid-xml"},"referenced_works_count":25,"referenced_works":["https://openalex.org/W308745112","https://openalex.org/W1973253288","https://openalex.org/W2101234009","https://openalex.org/W2114569717","https://openalex.org/W2130942839","https://openalex.org/W2139645402","https://openalex.org/W2145867197","https://openalex.org/W2188330943","https://openalex.org/W2251149908","https://openalex.org/W2252113950","https://openalex.org/W2516994063","https://openalex.org/W2562065833","https://openalex.org/W2619780982","https://openalex.org/W2747481658","https://openalex.org/W2774217579","https://openalex.org/W2886146035","https://openalex.org/W2886890203","https://openalex.org/W2887116241","https://openalex.org/W2928484296","https://openalex.org/W2954064526","https://openalex.org/W3032020872","https://openalex.org/W3043096572","https://openalex.org/W4237155282","https://openalex.org/W4255065514","https://openalex.org/W4288408927"],"related_works":["https://openalex.org/W2771594921","https://openalex.org/W4389976243","https://openalex.org/W2432897346","https://openalex.org/W2065387230","https://openalex.org/W2181336723","https://openalex.org/W3158134258","https://openalex.org/W2323937687","https://openalex.org/W648995381","https://openalex.org/W3033791384","https://openalex.org/W3138119129"],"abstract_inverted_index":{"Code-switching":[0],"has":[1],"long":[2],"interested":[3],"linguists,":[4],"with":[5,138],"computational":[6],"work":[7],"in":[8,28,38,74,85,90,115],"particular":[9],"focusing":[10],"on":[11],"speech":[12,94,130],"and":[13,59,72,88,95],"social":[14,96],"media":[15,97],"data":[16],"This":[17],"paper":[18],"contrasts":[19],"these":[20,86],"informal":[21],"instances":[22],"of":[23,36,45,63,105,110],"code-switching":[24,83,107],"to":[25,53,134],"its":[26],"appearance":[27],"more":[29,91],"formal":[30],"registers,":[31],"by":[32],"examining":[33],"the":[34,39,51,75,80,102,111,116],"mixture":[35],"languages":[37,66],"Deutsches":[40],"Textarchiv":[41],"(DTA),":[42],"a":[43,135],"corpus":[44,137],"1406":[46],"primarily":[47],"German":[48],"books":[49,87],"from":[50,108],"17th":[52],"19th":[54],"centuries.":[55],"We":[56,77],"automatically":[57],"annotate":[58],"manually":[60],"inspect":[61],"spans":[62],"six":[64],"embedded":[65,140],"(Latin,":[67],"French,":[68],"English,":[69],"Italian,":[70],"Spanish,":[71],"Greek)":[73],"corpus.":[76,118],"quantitatively":[78],"analyze":[79],"differences":[81],"between":[82],"patterns":[84],"those":[89],"typically":[92],"studied":[93],"corpora.":[98],"Furthermore,":[99],"we":[100],"address":[101],"practical":[103],"task":[104],"predicting":[106],"features":[109],"matrix":[112],"language":[113],"alone":[114],"DTA":[117],"Such":[119],"classifiers":[120],"can":[121],"help":[122],"reduce":[123],"errors":[124],"when":[125],"optical":[126],"character":[127],"recognition":[128],"or":[129],"transcription":[131],"is":[132],"applied":[133],"large":[136],"rare":[139],"languages.":[141]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
