{"id":"https://openalex.org/W1835075965","doi":"https://doi.org/10.3233/fi-2014-987","title":"An Efficient Framework for Extracting Parallel Sentences from Non-Parallel Corpora","display_name":"An Efficient Framework for Extracting Parallel Sentences from Non-Parallel Corpora","publication_year":2014,"publication_date":"2014-03-01","ids":{"openalex":"https://openalex.org/W1835075965","doi":"https://doi.org/10.3233/fi-2014-987","mag":"1835075965"},"language":"en","primary_location":{"id":"doi:10.3233/fi-2014-987","is_oa":false,"landing_page_url":"https://doi.org/10.3233/fi-2014-987","pdf_url":null,"source":{"id":"https://openalex.org/S39012697","display_name":"Fundamenta Informaticae","issn_l":"0169-2968","issn":["0169-2968","1875-8681"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318577","host_organization_name":"IOS Press","host_organization_lineage":["https://openalex.org/P4310318577"],"host_organization_lineage_names":["IOS Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Fundamenta Informaticae","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109139032","display_name":"Cuong Hoang","orcid":"https://orcid.org/0009-0005-2583-5332"},"institutions":[{"id":"https://openalex.org/I142732210","display_name":"University of Engineering and Technology Lahore","ror":"https://ror.org/0051w2v06","country_code":"PK","type":"education","lineage":["https://openalex.org/I142732210"]},{"id":"https://openalex.org/I177233841","display_name":"Vietnam National University, Hanoi","ror":"https://ror.org/02jmfj006","country_code":"VN","type":"education","lineage":["https://openalex.org/I177233841"]}],"countries":["PK","VN"],"is_corresponding":false,"raw_author_name":"Cuong Hoang","raw_affiliation_strings":["University of Engineering and Technology, Vietnam National University, Hanoi, Vietnam. cuongh.mi10@vnu.edu.vn","University of Engineering and Technology, Vietnam National University, Hanoi, Vietnam. cuongh.mi10@vnu.edu.vn#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Engineering and Technology, Vietnam National University, Hanoi, Vietnam. cuongh.mi10@vnu.edu.vn","institution_ids":["https://openalex.org/I177233841"]},{"raw_affiliation_string":"University of Engineering and Technology, Vietnam National University, Hanoi, Vietnam. cuongh.mi10@vnu.edu.vn#TAB#","institution_ids":["https://openalex.org/I142732210"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067682200","display_name":"Anh-Cuong Le","orcid":"https://orcid.org/0000-0003-2645-1419"},"institutions":[{"id":"https://openalex.org/I142732210","display_name":"University of Engineering and Technology Lahore","ror":"https://ror.org/0051w2v06","country_code":"PK","type":"education","lineage":["https://openalex.org/I142732210"]},{"id":"https://openalex.org/I177233841","display_name":"Vietnam National University, Hanoi","ror":"https://ror.org/02jmfj006","country_code":"VN","type":"education","lineage":["https://openalex.org/I177233841"]}],"countries":["PK","VN"],"is_corresponding":false,"raw_author_name":"Anh-Cuong Le","raw_affiliation_strings":["University of Engineering and Technology, Vietnam National University, Hanoi, Vietnam. cuongh.mi10@vnu.edu.vn","University of Engineering and Technology, Vietnam National University, Hanoi, Vietnam. cuongh.mi10@vnu.edu.vn#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Engineering and Technology, Vietnam National University, Hanoi, Vietnam. cuongh.mi10@vnu.edu.vn","institution_ids":["https://openalex.org/I177233841"]},{"raw_affiliation_string":"University of Engineering and Technology, Vietnam National University, Hanoi, Vietnam. cuongh.mi10@vnu.edu.vn#TAB#","institution_ids":["https://openalex.org/I142732210"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039374228","display_name":"Phuong-Thai Nguyen","orcid":null},"institutions":[{"id":"https://openalex.org/I142732210","display_name":"University of Engineering and Technology Lahore","ror":"https://ror.org/0051w2v06","country_code":"PK","type":"education","lineage":["https://openalex.org/I142732210"]},{"id":"https://openalex.org/I177233841","display_name":"Vietnam National University, Hanoi","ror":"https://ror.org/02jmfj006","country_code":"VN","type":"education","lineage":["https://openalex.org/I177233841"]}],"countries":["PK","VN"],"is_corresponding":false,"raw_author_name":"Phuong-Thai Nguyen","raw_affiliation_strings":["University of Engineering and Technology, Vietnam National University, Hanoi, Vietnam. cuongh.mi10@vnu.edu.vn","University of Engineering and Technology, Vietnam National University, Hanoi, Vietnam. cuongh.mi10@vnu.edu.vn#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Engineering and Technology, Vietnam National University, Hanoi, Vietnam. cuongh.mi10@vnu.edu.vn","institution_ids":["https://openalex.org/I177233841"]},{"raw_affiliation_string":"University of Engineering and Technology, Vietnam National University, Hanoi, Vietnam. cuongh.mi10@vnu.edu.vn#TAB#","institution_ids":["https://openalex.org/I142732210"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102175760","display_name":"Son Bao Pham","orcid":null},"institutions":[{"id":"https://openalex.org/I142732210","display_name":"University of Engineering and Technology Lahore","ror":"https://ror.org/0051w2v06","country_code":"PK","type":"education","lineage":["https://openalex.org/I142732210"]},{"id":"https://openalex.org/I177233841","display_name":"Vietnam National University, Hanoi","ror":"https://ror.org/02jmfj006","country_code":"VN","type":"education","lineage":["https://openalex.org/I177233841"]}],"countries":["PK","VN"],"is_corresponding":false,"raw_author_name":"Son Bao Pham","raw_affiliation_strings":["University of Engineering and Technology, Vietnam National University, Hanoi, Vietnam. cuongh.mi10@vnu.edu.vn","University of Engineering and Technology, Vietnam National University, Hanoi, Vietnam. cuongh.mi10@vnu.edu.vn#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Engineering and Technology, Vietnam National University, Hanoi, Vietnam. cuongh.mi10@vnu.edu.vn","institution_ids":["https://openalex.org/I177233841"]},{"raw_affiliation_string":"University of Engineering and Technology, Vietnam National University, Hanoi, Vietnam. cuongh.mi10@vnu.edu.vn#TAB#","institution_ids":["https://openalex.org/I142732210"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101646487","display_name":"Tu Bao Ho","orcid":"https://orcid.org/0000-0001-5951-643X"},"institutions":[{"id":"https://openalex.org/I177738480","display_name":"Japan Advanced Institute of Science and Technology","ror":"https://ror.org/03frj4r98","country_code":"JP","type":"education","lineage":["https://openalex.org/I177738480"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tu Bao Ho","raw_affiliation_strings":["Japan Advanced Institute of Science and Technology, Japan and John von Neumann Institute, Vietnam National University at Ho Chi Minh City, Vietnam"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Japan Advanced Institute of Science and Technology, Japan and John von Neumann Institute, Vietnam National University at Ho Chi Minh City, Vietnam","institution_ids":["https://openalex.org/I177738480"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.05049894,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"130","issue":"2","first_page":"179","last_page":"199"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9832000136375427,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7500048875808716},{"id":"https://openalex.org/keywords/parallel-corpora","display_name":"Parallel corpora","score":0.6173646450042725},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5743870735168457},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4600285291671753},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.37488436698913574},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.332302987575531},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.0736134946346283}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7500048875808716},{"id":"https://openalex.org/C2985367798","wikidata":"https://www.wikidata.org/wiki/Q1346592","display_name":"Parallel corpora","level":3,"score":0.6173646450042725},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5743870735168457},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4600285291671753},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.37488436698913574},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.332302987575531},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.0736134946346283}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3233/fi-2014-987","is_oa":false,"landing_page_url":"https://doi.org/10.3233/fi-2014-987","pdf_url":null,"source":{"id":"https://openalex.org/S39012697","display_name":"Fundamenta Informaticae","issn_l":"0169-2968","issn":["0169-2968","1875-8681"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310318577","host_organization_name":"IOS Press","host_organization_lineage":["https://openalex.org/P4310318577"],"host_organization_lineage_names":["IOS Press"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Fundamenta Informaticae","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6399999856948853,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W14574270","https://openalex.org/W1489181569","https://openalex.org/W1543107604","https://openalex.org/W1592081640","https://openalex.org/W1916559533","https://openalex.org/W1973152633","https://openalex.org/W1979531803","https://openalex.org/W2003948532","https://openalex.org/W2006969979","https://openalex.org/W2027189114","https://openalex.org/W2032175749","https://openalex.org/W2065565011","https://openalex.org/W2078861931","https://openalex.org/W2079078744","https://openalex.org/W2082172053","https://openalex.org/W2101105183","https://openalex.org/W2105313627","https://openalex.org/W2105673178","https://openalex.org/W2107695330","https://openalex.org/W2117652747","https://openalex.org/W2121227244","https://openalex.org/W2124807415","https://openalex.org/W2127128140","https://openalex.org/W2142843952","https://openalex.org/W2149327368","https://openalex.org/W2153653739","https://openalex.org/W2168929382","https://openalex.org/W2403876428","https://openalex.org/W2736790173","https://openalex.org/W2791294922","https://openalex.org/W2950186769"],"related_works":["https://openalex.org/W3204019825","https://openalex.org/W2143927888","https://openalex.org/W2242707303","https://openalex.org/W2757753881","https://openalex.org/W2123678043","https://openalex.org/W2125885330","https://openalex.org/W2902262852","https://openalex.org/W37319627","https://openalex.org/W1572297637","https://openalex.org/W2251265917"],"abstract_inverted_index":{"Automatically":[0],"building":[1,37],"a":[2,13,38,70,95,103],"large":[3,34],"bilingual":[4,112],"corpus":[5,31],"that":[6,78,98],"contains":[7],"millions":[8],"of":[9,20,87,121,138],"words":[10],"is":[11,24,33,94,99],"always":[12],"challenging":[14],"task.":[15],"In":[16],"particular":[17],"in":[18,50,56,82],"case":[19],"low-resource":[21],"languages,":[22],"it":[23],"difficult":[25],"to":[26,143],"find":[27],"an":[28],"existing":[29],"parallel":[30,65,75,132],"which":[32,60,80],"enough":[35],"for":[36,72,106,117],"real":[39],"statistical":[40,88],"machine":[41,89,139],"translation.":[42],"However,":[43],"comparable":[44],"non-parallel":[45],"corpora":[46,133],"are":[47],"richly":[48],"available":[49],"the":[51,85,108,118,136],"Internet":[52],"environment,":[53],"such":[54],"as":[55],"Wikipedia,":[57],"and":[58,123,125,134],"from":[59,77,141],"we":[61],"can":[62],"extract":[63],"valuable":[64],"texts.":[66],"This":[67],"work":[68],"presents":[69],"framework":[71,93],"effectively":[73],"extracting":[74],"sentences":[76],"resource,":[79],"results":[81,128],"significantly":[83],"improving":[84,135],"performance":[86],"translation":[90,140],"systems.":[91],"Our":[92],"bootstrapping-based":[96],"method":[97],"strengthened":[100],"by":[101],"using":[102],"new":[104],"measurement":[105],"estimating":[107],"similarity":[109],"between":[110],"two":[111],"sentences.":[113],"We":[114],"conduct":[115],"experiment":[116],"language":[119],"pair":[120],"English":[122,142],"Vietnamese":[124],"obtain":[126],"promising":[127],"on":[129],"both":[130],"constructing":[131],"accuracy":[137],"Vietnamese.":[144]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
