{"id":"https://openalex.org/W1983201496","doi":"https://doi.org/10.3115/1117794.1117808","title":"Word alignment of English-Chinese bilingual corpus based on chunks","display_name":"Word alignment of English-Chinese bilingual corpus based on chunks","publication_year":2000,"publication_date":"2000-01-01","ids":{"openalex":"https://openalex.org/W1983201496","doi":"https://doi.org/10.3115/1117794.1117808","mag":"1983201496"},"language":"en","primary_location":{"id":"doi:10.3115/1117794.1117808","is_oa":true,"landing_page_url":"https://doi.org/10.3115/1117794.1117808","pdf_url":"http://dl.acm.org/ft_gateway.cfm?id=1117808&type=pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2000 Joint SIGDAT conference on Empirical methods in natural language processing and very large corpora held in conjunction with the 38th Annual Meeting of the Association for Computational Linguistics -","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"http://dl.acm.org/ft_gateway.cfm?id=1117808&type=pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101652785","display_name":"Le Sun","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Le Sun","raw_affiliation_strings":["Chinese Academy of Sciences, Beijing, P R China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences, Beijing, P R China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021266867","display_name":"Youbing Jin","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Youbing Jin","raw_affiliation_strings":["Chinese Academy of Sciences, Beijing, P R China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences, Beijing, P R China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101907171","display_name":"Lin Du","orcid":"https://orcid.org/0000-0002-3174-7110"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lin Du","raw_affiliation_strings":["Chinese Academy of Sciences, Beijing, P R China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences, Beijing, P R China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100304840","display_name":"Yufang Sun","orcid":"https://orcid.org/0009-0004-3915-280X"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yufang Sun","raw_affiliation_strings":["Chinese Academy of Sciences, Beijing, P R China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences, Beijing, P R China","institution_ids":["https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101652785"],"corresponding_institution_ids":["https://openalex.org/I19820366"],"apc_list":null,"apc_paid":null,"fwci":0.5307,"has_fulltext":true,"cited_by_count":22,"citation_normalized_percentile":{"value":0.7571489,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"13","issue":null,"first_page":"110","last_page":"116"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9789999723434448,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8395268321037292},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.7654440402984619},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6749773621559143},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5986154079437256},{"id":"https://openalex.org/keywords/relation","display_name":"Relation (database)","score":0.48578861355781555},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.4483359456062317},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.4461011588573456},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4016456604003906},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.32018351554870605}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8395268321037292},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.7654440402984619},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6749773621559143},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5986154079437256},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.48578861355781555},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.4483359456062317},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.4461011588573456},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4016456604003906},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.32018351554870605},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3115/1117794.1117808","is_oa":true,"landing_page_url":"https://doi.org/10.3115/1117794.1117808","pdf_url":"http://dl.acm.org/ft_gateway.cfm?id=1117808&type=pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2000 Joint SIGDAT conference on Empirical methods in natural language processing and very large corpora held in conjunction with the 38th Annual Meeting of the Association for Computational Linguistics -","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.12.8514","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.12.8514","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://acl.ldc.upenn.edu/W/W00/W00-1314.pdf","raw_type":"text"}],"best_oa_location":{"id":"doi:10.3115/1117794.1117808","is_oa":true,"landing_page_url":"https://doi.org/10.3115/1117794.1117808","pdf_url":"http://dl.acm.org/ft_gateway.cfm?id=1117808&type=pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2000 Joint SIGDAT conference on Empirical methods in natural language processing and very large corpora held in conjunction with the 38th Annual Meeting of the Association for Computational Linguistics -","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.7699999809265137}],"awards":[{"id":"https://openalex.org/G5249178904","display_name":null,"funder_award_id":"Grant No. 6","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W1983201496.pdf","grobid_xml":"https://content.openalex.org/works/W1983201496.grobid-xml"},"referenced_works_count":13,"referenced_works":["https://openalex.org/W77384058","https://openalex.org/W125383268","https://openalex.org/W1489181569","https://openalex.org/W1503785188","https://openalex.org/W2006969979","https://openalex.org/W2065627366","https://openalex.org/W2074992284","https://openalex.org/W2075728986","https://openalex.org/W2088791674","https://openalex.org/W2097125878","https://openalex.org/W2138584836","https://openalex.org/W2151525026","https://openalex.org/W6674474963"],"related_works":["https://openalex.org/W4234874385","https://openalex.org/W2323648130","https://openalex.org/W2157140558","https://openalex.org/W2378782423","https://openalex.org/W2388988621","https://openalex.org/W2357797405","https://openalex.org/W2366623913","https://openalex.org/W2374905595","https://openalex.org/W2516693588","https://openalex.org/W2116112408"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"a":[3,64],"method":[4],"for":[5],"the":[6,26,35,52,59,83],"word":[7],"alignment":[8],"of":[9,19,29,37,45],"English-Chinese":[10],"corpus":[11,80],"based":[12],"on":[13],"chunks":[14,18,39],"is":[15,68],"proposed.":[16],"The":[17,43],"English":[20,38,56],"sentences":[21,31],"are":[22,32,49],"identified":[23],"firstly.":[24],"Then":[25],"chunk":[27,47,60],"boundaries":[28,48],"Chinese":[30,46],"predicted":[33],"by":[34,51,78],"translations":[36],"and":[40,81],"heuristic":[41],"information.":[42],"ambiguities":[44],"resolved":[50],"coterminous":[53],"words":[54],"in":[55],"chunks.":[57],"With":[58],"aligned":[61],"bilingual":[62],"corpus,":[63],"translation":[65],"relation":[66],"probability":[67],"proposed":[69],"to":[70],"align":[71],"words.":[72],"Finally,":[73],"we":[74],"evaluate":[75],"our":[76],"system":[77],"real":[79],"present":[82],"experiment":[84],"results.":[85]},"counts_by_year":[{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":1}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
