{"id":"https://openalex.org/W4393078878","doi":"https://doi.org/10.1109/taslp.2024.3380996","title":"Information Dropping Data Augmentation for Machine Translation Quality Estimation","display_name":"Information Dropping Data Augmentation for Machine Translation Quality Estimation","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4393078878","doi":"https://doi.org/10.1109/taslp.2024.3380996"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2024.3380996","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2024.3380996","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5025707866","display_name":"Shuo Li","orcid":"https://orcid.org/0000-0002-3488-6028"},"institutions":[{"id":"https://openalex.org/I151727225","display_name":"Harbin Engineering University","ror":"https://ror.org/03x80pn82","country_code":"CN","type":"education","lineage":["https://openalex.org/I151727225"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shuo Li","raw_affiliation_strings":["College of Information and Communication Engineering, Harbin Engineering University, Harbin, China"],"affiliations":[{"raw_affiliation_string":"College of Information and Communication Engineering, Harbin Engineering University, Harbin, China","institution_ids":["https://openalex.org/I151727225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069980045","display_name":"Xiaojun Bi","orcid":"https://orcid.org/0000-0002-5382-1000"},"institutions":[{"id":"https://openalex.org/I145897649","display_name":"Minzu University of China","ror":"https://ror.org/0044e2g62","country_code":"CN","type":"education","lineage":["https://openalex.org/I145897649"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaojun Bi","raw_affiliation_strings":["Key Laboratory of Ethnic Language Intelligent Analysis and Security Governance of MOE, Minzu University of China, Beijing, China","School of Information Engineering, Minzu University of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Ethnic Language Intelligent Analysis and Security Governance of MOE, Minzu University of China, Beijing, China","institution_ids":["https://openalex.org/I145897649"]},{"raw_affiliation_string":"School of Information Engineering, Minzu University of China, Beijing, China","institution_ids":["https://openalex.org/I145897649"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027944373","display_name":"Tao Liu","orcid":"https://orcid.org/0000-0001-5774-3428"},"institutions":[{"id":"https://openalex.org/I151727225","display_name":"Harbin Engineering University","ror":"https://ror.org/03x80pn82","country_code":"CN","type":"education","lineage":["https://openalex.org/I151727225"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tao Liu","raw_affiliation_strings":["College of Computer Science and Technology, Harbin Engineering University, Harbin, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Harbin Engineering University, Harbin, China","institution_ids":["https://openalex.org/I151727225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100370684","display_name":"Zheng Chen","orcid":"https://orcid.org/0000-0002-9654-0997"},"institutions":[{"id":"https://openalex.org/I145897649","display_name":"Minzu University of China","ror":"https://ror.org/0044e2g62","country_code":"CN","type":"education","lineage":["https://openalex.org/I145897649"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zheng Chen","raw_affiliation_strings":["Key Laboratory of Ethnic Language Intelligent Analysis and Security Governance of MOE, Minzu University of China, Beijing, China","School of Information Engineering, Minzu University of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Ethnic Language Intelligent Analysis and Security Governance of MOE, Minzu University of China, Beijing, China","institution_ids":["https://openalex.org/I145897649"]},{"raw_affiliation_string":"School of Information Engineering, Minzu University of China, Beijing, China","institution_ids":["https://openalex.org/I145897649"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5025707866"],"corresponding_institution_ids":["https://openalex.org/I151727225"],"apc_list":null,"apc_paid":null,"fwci":1.7559,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.86082961,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"32","issue":null,"first_page":"2112","last_page":"2124"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.982699990272522,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.666160523891449},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.5932208895683289},{"id":"https://openalex.org/keywords/estimation","display_name":"Estimation","score":0.5874691605567932},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5399377942085266},{"id":"https://openalex.org/keywords/data-quality","display_name":"Data quality","score":0.49493759870529175},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47669264674186707},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.4554460048675537},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.36298707127571106},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3587573170661926},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3525652289390564},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.10886156558990479},{"id":"https://openalex.org/keywords/operations-management","display_name":"Operations management","score":0.07674944400787354},{"id":"https://openalex.org/keywords/systems-engineering","display_name":"Systems engineering","score":0.05190718173980713}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.666160523891449},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.5932208895683289},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.5874691605567932},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5399377942085266},{"id":"https://openalex.org/C24756922","wikidata":"https://www.wikidata.org/wiki/Q1757694","display_name":"Data quality","level":3,"score":0.49493759870529175},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47669264674186707},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.4554460048675537},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.36298707127571106},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3587573170661926},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3525652289390564},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.10886156558990479},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.07674944400787354},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.05190718173980713},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taslp.2024.3380996","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2024.3380996","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1681167796","display_name":null,"funder_award_id":"62236011","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G840016979","display_name":null,"funder_award_id":"20&ZD279","funder_id":"https://openalex.org/F4320335869","funder_display_name":"National Social Science Fund of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335869","display_name":"National Social Science Fund of China","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":62,"referenced_works":["https://openalex.org/W1574447377","https://openalex.org/W1910131649","https://openalex.org/W1995875735","https://openalex.org/W2021618504","https://openalex.org/W2093790824","https://openalex.org/W2101105183","https://openalex.org/W2625967005","https://openalex.org/W2905266130","https://openalex.org/W2951902588","https://openalex.org/W2954996726","https://openalex.org/W2988975212","https://openalex.org/W3035174060","https://openalex.org/W3035390927","https://openalex.org/W3036789610","https://openalex.org/W3098359110","https://openalex.org/W3103840770","https://openalex.org/W3110137956","https://openalex.org/W3114537677","https://openalex.org/W3116506157","https://openalex.org/W3119881489","https://openalex.org/W3153832840","https://openalex.org/W3171003599","https://openalex.org/W3183168437","https://openalex.org/W3201915713","https://openalex.org/W4212947519","https://openalex.org/W4281690387","https://openalex.org/W4281728254","https://openalex.org/W4285112931","https://openalex.org/W4285233909","https://openalex.org/W4312091300","https://openalex.org/W4365456683","https://openalex.org/W4382202635","https://openalex.org/W4384976358","https://openalex.org/W4385572062","https://openalex.org/W4385573073","https://openalex.org/W4385573792","https://openalex.org/W4386566861","https://openalex.org/W4387725353","https://openalex.org/W4389519461","https://openalex.org/W4389523889","https://openalex.org/W4389523919","https://openalex.org/W6681703963","https://openalex.org/W6748751219","https://openalex.org/W6749806535","https://openalex.org/W6756622823","https://openalex.org/W6774569510","https://openalex.org/W6779514328","https://openalex.org/W6784669405","https://openalex.org/W6785493912","https://openalex.org/W6786899916","https://openalex.org/W6788101155","https://openalex.org/W6790920653","https://openalex.org/W6838983741","https://openalex.org/W6843414094","https://openalex.org/W6845657128","https://openalex.org/W6846519858","https://openalex.org/W6847312029","https://openalex.org/W6849422177","https://openalex.org/W6851306619","https://openalex.org/W6857511765","https://openalex.org/W7011189617","https://openalex.org/W7028504196"],"related_works":["https://openalex.org/W3011059803","https://openalex.org/W2775554247","https://openalex.org/W2883671469","https://openalex.org/W2728761353","https://openalex.org/W2110168585","https://openalex.org/W3107474891","https://openalex.org/W2250213760","https://openalex.org/W4386247111","https://openalex.org/W4327642362","https://openalex.org/W2587014613"],"abstract_inverted_index":{"Machine":[0],"translation":[1,55,73,86,159],"quality":[2,8,96],"estimation":[3],"(QE)":[4],"refers":[5],"to":[6,40,111,127,170,183],"the":[7,67,71,76,84,94,100,104,113,146,157,162,167,176,184],"assessment":[9],"of":[10,70,154,161],"machine":[11,54],"translations":[12],"without":[13,135],"a":[14,52],"given":[15],"reference":[16],"translation.":[17],"Supervised":[18],"QE":[19,56],"models":[20],"based":[21,60,74,120],"on":[22,61,75,121],"neural":[23],"networks":[24],"have":[25],"achieved":[26],"state-of-the-art":[27],"results.":[28],"But":[29],"this":[30],"method":[31,59,119,177],"requires":[32,37],"large-scale":[33],"training":[34,133],"data,":[35],"which":[36],"bilingual":[38],"experts":[39],"create":[41],"high-quality":[42],"labels.":[43],"This":[44,116],"is":[45],"often":[46],"very":[47],"costly.":[48],"Therefore,":[49],"we":[50,65,144],"propose":[51],"sentence-level":[53],"data":[57,108],"augmentation":[58],"information":[62,69,122],"dropping.":[63],"Firstly,":[64],"calculate":[66],"subwords":[68,82],"target":[72,85],"conditional":[77],"language":[78],"model.":[79,115],"Subsequently,":[80],"some":[81],"in":[83,156],"are":[87,109],"randomly":[88],"deleted":[89],"or":[90],"replaced.":[91],"We":[92],"obtain":[93,128],"pseudo":[95],"score":[97],"by":[98,151],"calculating":[99],"remaining":[101],"information.":[102],"Finally,":[103],"original":[105],"and":[106,131],"augmented":[107],"combined":[110],"train":[112],"final":[114],"pseudo-data":[117],"generation":[118],"dropping":[123],"strategy":[124],"enables":[125],"us":[126],"more":[129],"faithful":[130],"diverse":[132],"samples":[134],"requiring":[136],"additional":[137],"corpus":[138],"resources.":[139],"Experimental":[140],"results":[141],"show":[142],"that":[143],"improve":[145],"correlation":[147],"with":[148],"human":[149],"judgment":[150],"an":[152],"average":[153],"5.96%":[155],"seven":[158],"directions":[160],"MLQE-PE":[163],"dataset,":[164],"while":[165],"improving":[166],"model's":[168],"robustness":[169],"low":[171],"adequacy":[172],"samples.":[173],"In":[174],"addition,":[175],"does":[178],"not":[179],"require":[180],"any":[181],"modifications":[182],"model":[185],"architecture.":[186]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-25T14:56:36.534964","created_date":"2025-10-10T00:00:00"}
