{"id":"https://openalex.org/W3016012197","doi":"https://doi.org/10.1145/3377851","title":"Improving Neural Machine Translation with Linear Interpolation of a Short-Path Unit","display_name":"Improving Neural Machine Translation with Linear Interpolation of a Short-Path Unit","publication_year":2020,"publication_date":"2020-02-07","ids":{"openalex":"https://openalex.org/W3016012197","doi":"https://doi.org/10.1145/3377851","mag":"3016012197"},"language":"en","primary_location":{"id":"doi:10.1145/3377851","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3377851","pdf_url":null,"source":{"id":"https://openalex.org/S4306421405","display_name":"ACM Transactions on Asian and Low-Resource Language Information Processing","issn_l":"2375-4699","issn":["2375-4699","2375-4702"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Asian and Low-Resource Language Information Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101701181","display_name":"Yachao Li","orcid":"https://orcid.org/0000-0002-9423-9922"},"institutions":[{"id":"https://openalex.org/I145897649","display_name":"Minzu University of China","ror":"https://ror.org/0044e2g62","country_code":"CN","type":"education","lineage":["https://openalex.org/I145897649"]},{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yachao Li","raw_affiliation_strings":["Harbin Institute of Technology","Soochow University 8 Northwest Minzu University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology","institution_ids":["https://openalex.org/I204983213"]},{"raw_affiliation_string":"Soochow University 8 Northwest Minzu University","institution_ids":["https://openalex.org/I145897649"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100369260","display_name":"Junhui Li","orcid":"https://orcid.org/0000-0001-7829-6348"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Junhui Li","raw_affiliation_strings":["Soochow University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Soochow University","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100402911","display_name":"Min Zhang","orcid":"https://orcid.org/0000-0002-3895-5510"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Min Zhang","raw_affiliation_strings":["Soochow University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Soochow University","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100459836","display_name":"Yixin Li","orcid":"https://orcid.org/0009-0002-9290-5300"},"institutions":[{"id":"https://openalex.org/I145897649","display_name":"Minzu University of China","ror":"https://ror.org/0044e2g62","country_code":"CN","type":"education","lineage":["https://openalex.org/I145897649"]},{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yixin Li","raw_affiliation_strings":["Harbin Institute of Technology","Soochow University 8 Northwest Minzu University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology","institution_ids":["https://openalex.org/I204983213"]},{"raw_affiliation_string":"Soochow University 8 Northwest Minzu University","institution_ids":["https://openalex.org/I145897649"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010898755","display_name":"Peng Zou","orcid":"https://orcid.org/0000-0002-8484-5769"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peng Zou","raw_affiliation_strings":["Harbin Institute of Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology","institution_ids":["https://openalex.org/I204983213"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.8125,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.78544818,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"19","issue":"3","first_page":"1","last_page":"16"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9805999994277954,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7308081388473511},{"id":"https://openalex.org/keywords/interpolation","display_name":"Interpolation (computer graphics)","score":0.602959156036377},{"id":"https://openalex.org/keywords/linear-interpolation","display_name":"Linear interpolation","score":0.5956071615219116},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.5900651812553406},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.5641341209411621},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5462803244590759},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5112795829772949},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.505990207195282},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5032615065574646},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48516756296157837},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.42940017580986023},{"id":"https://openalex.org/keywords/linear-model","display_name":"Linear model","score":0.4254534840583801},{"id":"https://openalex.org/keywords/association","display_name":"Association (psychology)","score":0.4236676096916199},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.40883952379226685},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.37835657596588135},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.33275026082992554},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.18425938487052917},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.15797823667526245},{"id":"https://openalex.org/keywords/geometry","display_name":"Geometry","score":0.10061466693878174},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.07708510756492615}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7308081388473511},{"id":"https://openalex.org/C137800194","wikidata":"https://www.wikidata.org/wiki/Q11713455","display_name":"Interpolation (computer graphics)","level":3,"score":0.602959156036377},{"id":"https://openalex.org/C171836373","wikidata":"https://www.wikidata.org/wiki/Q2266329","display_name":"Linear interpolation","level":3,"score":0.5956071615219116},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.5900651812553406},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.5641341209411621},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5462803244590759},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5112795829772949},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.505990207195282},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5032615065574646},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48516756296157837},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.42940017580986023},{"id":"https://openalex.org/C163175372","wikidata":"https://www.wikidata.org/wiki/Q3339222","display_name":"Linear model","level":2,"score":0.4254534840583801},{"id":"https://openalex.org/C142853389","wikidata":"https://www.wikidata.org/wiki/Q744778","display_name":"Association (psychology)","level":2,"score":0.4236676096916199},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.40883952379226685},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.37835657596588135},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.33275026082992554},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.18425938487052917},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15797823667526245},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.10061466693878174},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.07708510756492615},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3377851","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3377851","pdf_url":null,"source":{"id":"https://openalex.org/S4306421405","display_name":"ACM Transactions on Asian and Low-Resource Language Information Processing","issn_l":"2375-4699","issn":["2375-4699","2375-4702"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Asian and Low-Resource Language Information Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.44999998807907104,"display_name":"Decent work and economic growth","id":"https://metadata.un.org/sdg/8"}],"awards":[{"id":"https://openalex.org/G2167325965","display_name":null,"funder_award_id":"61525205 and 61876120","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W1902237438","https://openalex.org/W1916589227","https://openalex.org/W2064675550","https://openalex.org/W2101105183","https://openalex.org/W2107878631","https://openalex.org/W2156985047","https://openalex.org/W2157331557","https://openalex.org/W2194775991","https://openalex.org/W2241862190","https://openalex.org/W2252272516","https://openalex.org/W2292919134","https://openalex.org/W2483327705","https://openalex.org/W2552839021","https://openalex.org/W2572403989","https://openalex.org/W2798761464","https://openalex.org/W2888520903","https://openalex.org/W2930957955","https://openalex.org/W2962784628","https://openalex.org/W2962886257","https://openalex.org/W2963260202","https://openalex.org/W2963599677","https://openalex.org/W2963631431","https://openalex.org/W2963913268","https://openalex.org/W2963991316","https://openalex.org/W2964298349","https://openalex.org/W2965575120","https://openalex.org/W2998243336","https://openalex.org/W4299828299"],"related_works":["https://openalex.org/W3183609115","https://openalex.org/W2387056800","https://openalex.org/W2389908107","https://openalex.org/W2108850688","https://openalex.org/W2354295809","https://openalex.org/W2532653122","https://openalex.org/W2359833404","https://openalex.org/W1994390986","https://openalex.org/W2378343395","https://openalex.org/W2322862099"],"abstract_inverted_index":{"In":[0,82,110],"neural":[1,19,49],"machine":[2],"translation":[3,181,194],"(NMT),":[4],"the":[5,12,41,44,55,92,145,185,192,212,220],"source":[6,58,67,95,129,134,146,215],"and":[7,51,60,96,154,178,199,216,234],"target":[8,75,97,217],"words":[9,59,98],"are":[10],"at":[11],"two":[13],"ends":[14],"of":[15,26,43,78,94,167,188,214],"a":[16,24,47,64,66,74],"large":[17],"deep":[18,48],"network,":[20,50],"normally":[21],"mediated":[22],"by":[23,99,196],"series":[25],"non-linear":[27,34],"activations.":[28],"The":[29],"problem":[30],"with":[31,118,125,141,160],"such":[32],"consequent":[33],"activations":[35],"is":[36,229],"that":[37,184,207,225],"they":[38],"significantly":[39,190],"decrease":[40],"magnitude":[42],"gradient":[45],"in":[46,232],"thus":[52],"gradually":[53],"loosen":[54],"interaction":[56],"between":[57],"their":[61],"translations.":[62],"As":[63],"result,":[65],"word":[68,76,130],"may":[69],"be":[70],"incorrectly":[71],"translated":[72],"into":[73,133,171],"out":[77],"its":[79],"translational":[80],"equivalents.":[81],"this":[83],"article,":[84],"we":[85,112,222],"propose":[86],"short-path":[87],"units":[88],"(SPUs)":[89],"to":[90,150],"strengthen":[91,211],"association":[93,213],"allowing":[100],"information":[101],"flow":[102,149],"over":[103],"adjacent":[104],"layers":[105],"effectively":[106],"via":[107],"linear":[108,165,186],"interpolation.":[109],"particular,":[111],"enrich":[113],"three":[114],"critical":[115],"NMT":[116],"components":[117],"SPUs:":[119],"(1)":[120],"an":[121,137,156],"enriched":[122,138,157],"encoding":[123],"model":[124,140,159,228],"SPU,":[126,142,161],"which":[127,143,162],"interpolates":[128],"embeddings":[131],"linearly":[132,148],"annotations;":[135],"(2)":[136],"decoding":[139],"enables":[144],"context":[147],"target-side":[151,168],"hidden":[152,169],"states;":[153],"(3)":[155],"output":[158,172],"further":[163],"allows":[164],"interpolation":[166,187],"states":[170],"states.":[173],"Experimentation":[174],"on":[175],"Chinese-to-English,":[176],"English-to-German,":[177],"low-resource":[179,235],"Tibetan-to-Chinese":[180],"tasks":[182],"demonstrates":[183],"SPUs":[189],"improves":[191],"overall":[193],"quality":[195],"1.88,":[197],"1.43,":[198],"3.75":[200],"BLEU,":[201],"respectively.":[202],"Moreover,":[203],"detailed":[204],"analysis":[205],"shows":[206],"our":[208,226],"approaches":[209],"much":[210],"words.":[218],"From":[219],"preceding,":[221],"can":[223],"see":[224],"proposed":[227],"effective":[230],"both":[231],"rich-":[233],"scenarios.":[236]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
