{"id":"https://openalex.org/W2089379373","doi":"https://doi.org/10.3115/1117794.1117806","title":"Cross-lingual information retrieval using hidden Markov models","display_name":"Cross-lingual information retrieval using hidden Markov models","publication_year":2000,"publication_date":"2000-01-01","ids":{"openalex":"https://openalex.org/W2089379373","doi":"https://doi.org/10.3115/1117794.1117806","mag":"2089379373"},"language":"en","primary_location":{"id":"doi:10.3115/1117794.1117806","is_oa":true,"landing_page_url":"https://doi.org/10.3115/1117794.1117806","pdf_url":"https://dl.acm.org/doi/pdf/10.3115/1117794.1117806","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2000 Joint SIGDAT conference on Empirical methods in natural language processing and very large corpora held in conjunction with the 38th Annual Meeting of the Association for Computational Linguistics -","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.3115/1117794.1117806","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108487796","display_name":"Jinxi Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Jinxi Xu","raw_affiliation_strings":["BBN Technologies, Cambridge, MA"],"affiliations":[{"raw_affiliation_string":"BBN Technologies, Cambridge, MA","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5011618765","display_name":"Ralph Weischedel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ralph Weischedel","raw_affiliation_strings":["BBN Technologies, Cambridge, MA"],"affiliations":[{"raw_affiliation_string":"BBN Technologies, Cambridge, MA","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5108487796"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.6955,"has_fulltext":true,"cited_by_count":59,"citation_normalized_percentile":{"value":0.94413592,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"13","issue":null,"first_page":"95","last_page":"103"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8587318658828735},{"id":"https://openalex.org/keywords/ambiguity","display_name":"Ambiguity","score":0.6487197875976562},{"id":"https://openalex.org/keywords/bilingual-dictionary","display_name":"Bilingual dictionary","score":0.6270122528076172},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.6209186315536499},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6032134890556335},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.5894142985343933},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5670932531356812},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5480827689170837},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.5440908670425415},{"id":"https://openalex.org/keywords/cross-language-information-retrieval","display_name":"Cross-language information retrieval","score":0.4491698741912842},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.4437364935874939},{"id":"https://openalex.org/keywords/contrast","display_name":"Contrast (vision)","score":0.4371238946914673},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.4170340597629547}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8587318658828735},{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.6487197875976562},{"id":"https://openalex.org/C2779235283","wikidata":"https://www.wikidata.org/wiki/Q2640207","display_name":"Bilingual dictionary","level":2,"score":0.6270122528076172},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.6209186315536499},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6032134890556335},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.5894142985343933},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5670932531356812},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5480827689170837},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.5440908670425415},{"id":"https://openalex.org/C2778842860","wikidata":"https://www.wikidata.org/wiki/Q986551","display_name":"Cross-language information retrieval","level":3,"score":0.4491698741912842},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.4437364935874939},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.4371238946914673},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.4170340597629547},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.3115/1117794.1117806","is_oa":true,"landing_page_url":"https://doi.org/10.3115/1117794.1117806","pdf_url":"https://dl.acm.org/doi/pdf/10.3115/1117794.1117806","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2000 Joint SIGDAT conference on Empirical methods in natural language processing and very large corpora held in conjunction with the 38th Annual Meeting of the Association for Computational Linguistics -","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.12.3620","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.12.3620","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://acl.ldc.upenn.edu/W/W00/W00-1312.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.336.9477","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.336.9477","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.mt-archive.info/EMNLP-2000-Xu.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.415.8856","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.415.8856","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cs.jhu.edu/~yarowsky/acl2000/sigdat/xu.pdf","raw_type":"text"}],"best_oa_location":{"id":"doi:10.3115/1117794.1117806","is_oa":true,"landing_page_url":"https://doi.org/10.3115/1117794.1117806","pdf_url":"https://dl.acm.org/doi/pdf/10.3115/1117794.1117806","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2000 Joint SIGDAT conference on Empirical methods in natural language processing and very large corpora held in conjunction with the 38th Annual Meeting of the Association for Computational Linguistics -","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.800000011920929,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2089379373.pdf","grobid_xml":"https://content.openalex.org/works/W2089379373.grobid-xml"},"referenced_works_count":24,"referenced_works":["https://openalex.org/W41800150","https://openalex.org/W1490627662","https://openalex.org/W1540124269","https://openalex.org/W1570490112","https://openalex.org/W1589050831","https://openalex.org/W1980515494","https://openalex.org/W2008248260","https://openalex.org/W2008495066","https://openalex.org/W2015629112","https://openalex.org/W2021822930","https://openalex.org/W2044157185","https://openalex.org/W2082729696","https://openalex.org/W2093390569","https://openalex.org/W2093976457","https://openalex.org/W2095368471","https://openalex.org/W2110189854","https://openalex.org/W2118305464","https://openalex.org/W2125838338","https://openalex.org/W2161935199","https://openalex.org/W4206765718","https://openalex.org/W4231488796","https://openalex.org/W4253573210","https://openalex.org/W4253938478","https://openalex.org/W6645197570"],"related_works":["https://openalex.org/W2251642064","https://openalex.org/W104838891","https://openalex.org/W1018161198","https://openalex.org/W2802443881","https://openalex.org/W2400846488","https://openalex.org/W1956839949","https://openalex.org/W2153428533","https://openalex.org/W2062630764","https://openalex.org/W2117119592","https://openalex.org/W2155836137"],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"empirical":[3],"results":[4],"in":[5,27],"cross-lingual":[6],"information":[7],"retrieval":[8,60],"using":[9],"English":[10],"queries":[11],"to":[12],"access":[13],"Chinese":[14],"documents":[15,21],"(TREC-5":[16],"and":[17,19,59],"TREC-6)":[18],"Spanish":[20],"(TREC-4).":[22],"Since":[23],"our":[24],"interest":[25],"is":[26],"languages":[28],"where":[29],"resources":[30],"may":[31],"be":[32],"minimal,":[33],"we":[34,70],"use":[35],"an":[36,72],"integrated":[37],"probabilistic":[38],"model":[39,55],"that":[40],"requires":[41],"only":[42],"a":[43,47,52,81,89],"bilingual":[44,92],"dictionary":[45,93],"as":[46,88],"resource.":[48],"We":[49,84],"explore":[50],"how":[51],"combined":[53],"probability":[54],"of":[56,65,91],"term":[57],"translation":[58,66,78],"can":[61],"reduce":[62],"the":[63],"effect":[64],"ambiguity.":[67],"In":[68],"addition,":[69],"estimate":[71],"upper":[73],"bound":[74],"on":[75],"performance,":[76],"if":[77],"ambiguity":[79],"were":[80],"solved":[82],"problem.":[83],"also":[85],"measure":[86],"performance":[87],"function":[90],"size.":[94]},"counts_by_year":[{"year":2024,"cited_by_count":22},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":2},{"year":2014,"cited_by_count":1},{"year":2012,"cited_by_count":2}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
