{"id":"https://openalex.org/W2758994255","doi":"https://doi.org/10.18653/v1/w17-4007","title":"Word Transduction for Addressing the OOV Problem in Machine Translation for Similar Resource-Scarce Languages","display_name":"Word Transduction for Addressing the OOV Problem in Machine Translation for Similar Resource-Scarce Languages","publication_year":2017,"publication_date":"2017-01-01","ids":{"openalex":"https://openalex.org/W2758994255","doi":"https://doi.org/10.18653/v1/w17-4007","mag":"2758994255"},"language":"en","primary_location":{"id":"doi:10.18653/v1/w17-4007","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w17-4007","pdf_url":"https://www.aclweb.org/anthology/W17-4007.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 13th International Conference on Finite State\n          Methods and Natural Language Processing (FSMNLP 2017)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/W17-4007.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110306829","display_name":"Shashikant Sharma","orcid":null},"institutions":[{"id":"https://openalex.org/I56404289","display_name":"Indian Institute of Technology BHU","ror":"https://ror.org/01kh5gc44","country_code":"IN","type":"education","lineage":["https://openalex.org/I56404289"]},{"id":"https://openalex.org/I91357014","display_name":"Banaras Hindu University","ror":"https://ror.org/04cdn2797","country_code":"IN","type":"education","lineage":["https://openalex.org/I91357014"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Shashikant Sharma","raw_affiliation_strings":["IIT (BHU), Varanasi, India"],"affiliations":[{"raw_affiliation_string":"IIT (BHU), Varanasi, India","institution_ids":["https://openalex.org/I56404289","https://openalex.org/I91357014"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015174369","display_name":"Anil Kumar Singh","orcid":"https://orcid.org/0000-0001-7177-5901"},"institutions":[{"id":"https://openalex.org/I91357014","display_name":"Banaras Hindu University","ror":"https://ror.org/04cdn2797","country_code":"IN","type":"education","lineage":["https://openalex.org/I91357014"]},{"id":"https://openalex.org/I56404289","display_name":"Indian Institute of Technology BHU","ror":"https://ror.org/01kh5gc44","country_code":"IN","type":"education","lineage":["https://openalex.org/I56404289"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Anil Kumar Singh","raw_affiliation_strings":["IIT (BHU), Varanasi, India"],"affiliations":[{"raw_affiliation_string":"IIT (BHU), Varanasi, India","institution_ids":["https://openalex.org/I56404289","https://openalex.org/I91357014"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5110306829"],"corresponding_institution_ids":["https://openalex.org/I56404289","https://openalex.org/I91357014"],"apc_list":null,"apc_paid":null,"fwci":0.7801,"has_fulltext":true,"cited_by_count":4,"citation_normalized_percentile":{"value":0.79697887,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"56","last_page":"63"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9898999929428101,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.831899881362915},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6846308708190918},{"id":"https://openalex.org/keywords/transduction","display_name":"Transduction (biophysics)","score":0.6687953472137451},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.6489188075065613},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6408722400665283},{"id":"https://openalex.org/keywords/phrase","display_name":"Phrase","score":0.6252879500389099},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.6224185228347778},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.5674858093261719},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.4902990162372589},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.48277679085731506},{"id":"https://openalex.org/keywords/phonology","display_name":"Phonology","score":0.46133506298065186},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.4214790463447571},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3510451018810272},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.20169278979301453},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08207538723945618}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.831899881362915},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6846308708190918},{"id":"https://openalex.org/C15152581","wikidata":"https://www.wikidata.org/wiki/Q7833966","display_name":"Transduction (biophysics)","level":2,"score":0.6687953472137451},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.6489188075065613},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6408722400665283},{"id":"https://openalex.org/C2776224158","wikidata":"https://www.wikidata.org/wiki/Q187931","display_name":"Phrase","level":2,"score":0.6252879500389099},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.6224185228347778},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.5674858093261719},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.4902990162372589},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.48277679085731506},{"id":"https://openalex.org/C148934300","wikidata":"https://www.wikidata.org/wiki/Q40998","display_name":"Phonology","level":2,"score":0.46133506298065186},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.4214790463447571},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3510451018810272},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.20169278979301453},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08207538723945618},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/w17-4007","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w17-4007","pdf_url":"https://www.aclweb.org/anthology/W17-4007.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 13th International Conference on Finite State\n          Methods and Natural Language Processing (FSMNLP 2017)","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/w17-4007","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w17-4007","pdf_url":"https://www.aclweb.org/anthology/W17-4007.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 13th International Conference on Finite State\n          Methods and Natural Language Processing (FSMNLP 2017)","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2758994255.pdf","grobid_xml":"https://content.openalex.org/works/W2758994255.grobid-xml"},"referenced_works_count":15,"referenced_works":["https://openalex.org/W16967297","https://openalex.org/W1971652730","https://openalex.org/W2042987798","https://openalex.org/W2072088932","https://openalex.org/W2101105183","https://openalex.org/W2113788796","https://openalex.org/W2124807415","https://openalex.org/W2135532889","https://openalex.org/W2152134037","https://openalex.org/W2156985047","https://openalex.org/W2172208814","https://openalex.org/W2322728950","https://openalex.org/W2408555016","https://openalex.org/W2595715041","https://openalex.org/W2740141831"],"related_works":["https://openalex.org/W4289914452","https://openalex.org/W2890433954","https://openalex.org/W2384400852","https://openalex.org/W3204898214","https://openalex.org/W2963259630","https://openalex.org/W4240926580","https://openalex.org/W2070920720","https://openalex.org/W2122294272","https://openalex.org/W2398549619","https://openalex.org/W1542743110"],"abstract_inverted_index":{"Similar":[0],"languages":[1],"have":[2,74],"a":[3,30,91,112,123],"large":[4],"number":[5],"of":[6,42,67,86,110,153],"cognate":[7],"words":[8,18,88,142],"which":[9,70],"can":[10,78,136],"be":[11,96,138],"exploited":[12],"to":[13,50,63,80,140,150],"deal":[14],"with":[15],"Out-Of-Vocabulary":[16],"(OOV)":[17],"problem.":[19,38],"This":[20,94],"problem":[21],"is":[22,48,60,132],"especially":[23],"severe":[24],"for":[25,32,35,56,107,119],"resource-scarce":[26],"languages.":[27],"We":[28,39,77,104],"propose":[29],"method":[31],"'word":[33],"transduction'":[34],"addressing":[36],"this":[37],"take":[40],"advantage":[41],"the":[43,151,154],"fact":[44],"that,":[45,106],"although":[46],"it":[47,59],"difficult":[49],"prepare":[51,64],"sentence":[52],"aligned":[53],"parallel":[54,92],"corpus":[55],"such":[57,90],"languages,":[58],"much":[61],"easier":[62],"'parallel'":[65],"list":[66],"word":[68,134],"pairs":[69],"are":[71],"cognates":[72],"and":[73,147],"similar":[75,145],"pronunciations.":[76],"try":[79],"learn":[81],"pronunciations":[82],"(or":[83],"orthographic":[84],"representations)":[85],"OOV":[87],"from":[89,143],"list.":[93],"could":[95],"done":[97],"by":[98],"using":[99],"phrase-based":[100],"machine":[101],"translation":[102],"(PBMT).":[103],"show":[105],"small":[108],"amount":[109],"data,":[111],"model":[113],"based":[114],"on":[115],"weighted":[116],"rewrite":[117],"rules":[118],"phoneme":[120],"chunks":[121],"outperforms":[122],"PBMT-based":[124],"approach.":[125],"An":[126],"additional":[127],"point":[128],"that":[129,133],"we":[130],"make":[131],"transduction":[135],"also":[137],"used":[139],"borrow":[141],"another":[144],"language":[146],"adapt":[148],"them":[149],"phonology":[152],"target":[155],"language.":[156]},"counts_by_year":[{"year":2019,"cited_by_count":3},{"year":2017,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
