{"id":"https://openalex.org/W7081971863","doi":"https://doi.org/10.5715/jnlp.32.886","title":"Cross-lingual Contextualized Phrase Retrieval","display_name":"Cross-lingual Contextualized Phrase Retrieval","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W7081971863","doi":"https://doi.org/10.5715/jnlp.32.886"},"language":"en","primary_location":{"id":"doi:10.5715/jnlp.32.886","is_oa":true,"landing_page_url":"https://doi.org/10.5715/jnlp.32.886","pdf_url":"https://www.jstage.jst.go.jp/article/jnlp/32/3/32_886/_pdf","source":{"id":"https://openalex.org/S4210212357","display_name":"Journal of Natural Language Processing","issn_l":"1340-7619","issn":["1340-7619","2185-8314"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Natural Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://www.jstage.jst.go.jp/article/jnlp/32/3/32_886/_pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Huayang Li","orcid":null},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Huayang Li","raw_affiliation_strings":["Nara Institute of Science and Technology"],"affiliations":[{"raw_affiliation_string":"Nara Institute of Science and Technology","institution_ids":["https://openalex.org/I75917431"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Deng Cai","orcid":null},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Deng Cai","raw_affiliation_strings":["Tencent AI Lab"],"affiliations":[{"raw_affiliation_string":"Tencent AI Lab","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zhi Qu","orcid":null},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Zhi Qu","raw_affiliation_strings":["Nara Institute of Science and Technology"],"affiliations":[{"raw_affiliation_string":"Nara Institute of Science and Technology","institution_ids":["https://openalex.org/I75917431"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Qu Cui","orcid":null},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qu Cui","raw_affiliation_strings":["Tencent AI Lab"],"affiliations":[{"raw_affiliation_string":"Tencent AI Lab","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Hidetaka Kamigaito","orcid":null},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hidetaka Kamigaito","raw_affiliation_strings":["Nara Institute of Science and Technology"],"affiliations":[{"raw_affiliation_string":"Nara Institute of Science and Technology","institution_ids":["https://openalex.org/I75917431"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Lemao Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lemao Liu","raw_affiliation_strings":["Tencent AI Lab"],"affiliations":[{"raw_affiliation_string":"Tencent AI Lab","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"last","author":{"id":null,"display_name":"Taro Watanabe","orcid":null},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Taro Watanabe","raw_affiliation_strings":["Nara Institute of Science and Technology"],"affiliations":[{"raw_affiliation_string":"Nara Institute of Science and Technology","institution_ids":["https://openalex.org/I75917431"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I75917431"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.63276306,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"32","issue":"3","first_page":"886","last_page":"917"},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T12157","display_name":"Geochemistry and Geologic Mapping","score":0.6744999885559082,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12157","display_name":"Geochemistry and Geologic Mapping","score":0.6744999885559082,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13067","display_name":"Geological Modeling and Analysis","score":0.028599999845027924,"subfield":{"id":"https://openalex.org/subfields/1906","display_name":"Geochemistry and Petrology"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14311","display_name":"Electrical and Electromagnetic Research","score":0.018300000578165054,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/phrase","display_name":"Phrase","score":0.7628999948501587},{"id":"https://openalex.org/keywords/polysemy","display_name":"Polysemy","score":0.6891999840736389},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5648000240325928},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5509999990463257},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.5472999811172485},{"id":"https://openalex.org/keywords/noun-phrase","display_name":"Noun phrase","score":0.534500002861023},{"id":"https://openalex.org/keywords/phrase-structure-rules","display_name":"Phrase structure rules","score":0.38530001044273376}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.808899998664856},{"id":"https://openalex.org/C2776224158","wikidata":"https://www.wikidata.org/wiki/Q187931","display_name":"Phrase","level":2,"score":0.7628999948501587},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.7545999884605408},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6987000107765198},{"id":"https://openalex.org/C2780276568","wikidata":"https://www.wikidata.org/wiki/Q191928","display_name":"Polysemy","level":2,"score":0.6891999840736389},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5648000240325928},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5509999990463257},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.5472999811172485},{"id":"https://openalex.org/C153962237","wikidata":"https://www.wikidata.org/wiki/Q1401131","display_name":"Noun phrase","level":3,"score":0.534500002861023},{"id":"https://openalex.org/C80877019","wikidata":"https://www.wikidata.org/wiki/Q7188074","display_name":"Phrase structure rules","level":3,"score":0.38530001044273376},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.38339999318122864},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.3659000098705292},{"id":"https://openalex.org/C88880766","wikidata":"https://www.wikidata.org/wiki/Q1201147","display_name":"Determiner phrase","level":4,"score":0.35339999198913574},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.31279999017715454},{"id":"https://openalex.org/C131042201","wikidata":"https://www.wikidata.org/wiki/Q493198","display_name":"Endocentric and exocentric","level":4,"score":0.27559998631477356},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2671000063419342},{"id":"https://openalex.org/C2779514573","wikidata":"https://www.wikidata.org/wiki/Q1778442","display_name":"Verb phrase","level":4,"score":0.2644999921321869},{"id":"https://openalex.org/C59656382","wikidata":"https://www.wikidata.org/wiki/Q191536","display_name":"Conjunction (astronomy)","level":2,"score":0.26159998774528503},{"id":"https://openalex.org/C28076734","wikidata":"https://www.wikidata.org/wiki/Q63087","display_name":"Coreference","level":3,"score":0.25679999589920044}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.5715/jnlp.32.886","is_oa":true,"landing_page_url":"https://doi.org/10.5715/jnlp.32.886","pdf_url":"https://www.jstage.jst.go.jp/article/jnlp/32/3/32_886/_pdf","source":{"id":"https://openalex.org/S4210212357","display_name":"Journal of Natural Language Processing","issn_l":"1340-7619","issn":["1340-7619","2185-8314"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Natural Language Processing","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.5715/jnlp.32.886","is_oa":true,"landing_page_url":"https://doi.org/10.5715/jnlp.32.886","pdf_url":"https://www.jstage.jst.go.jp/article/jnlp/32/3/32_886/_pdf","source":{"id":"https://openalex.org/S4210212357","display_name":"Journal of Natural Language Processing","issn_l":"1340-7619","issn":["1340-7619","2185-8314"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Natural Language Processing","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.6210674047470093,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7081971863.pdf","grobid_xml":"https://content.openalex.org/works/W7081971863.grobid-xml"},"referenced_works_count":41,"referenced_works":["https://openalex.org/W2141532438","https://openalex.org/W2152263452","https://openalex.org/W2153653739","https://openalex.org/W2156985047","https://openalex.org/W2788330850","https://openalex.org/W2905342727","https://openalex.org/W2952682849","https://openalex.org/W2962784628","https://openalex.org/W2963047628","https://openalex.org/W2963469388","https://openalex.org/W2963829526","https://openalex.org/W2963967365","https://openalex.org/W2963979492","https://openalex.org/W2970168256","https://openalex.org/W2970295111","https://openalex.org/W2970618241","https://openalex.org/W2987249037","https://openalex.org/W3001434439","https://openalex.org/W3016973796","https://openalex.org/W3035390927","https://openalex.org/W3039695075","https://openalex.org/W3099700870","https://openalex.org/W3100806282","https://openalex.org/W3105214104","https://openalex.org/W3155609600","https://openalex.org/W3156636935","https://openalex.org/W3170427498","https://openalex.org/W3174160883","https://openalex.org/W3175627818","https://openalex.org/W3175863856","https://openalex.org/W3176913643","https://openalex.org/W3194782062","https://openalex.org/W4206555128","https://openalex.org/W4224299209","https://openalex.org/W4285226496","https://openalex.org/W4385571209","https://openalex.org/W4385571506","https://openalex.org/W4385574194","https://openalex.org/W4385574304","https://openalex.org/W4404781563","https://openalex.org/W4404784207"],"related_works":[],"abstract_inverted_index":{"Phrase-level":[0],"dense":[1,30],"retrieval":[2,117,134],"has":[3],"shown":[4],"many":[5],"appealing":[6],"characteristics":[7],"in":[8,170,189],"downstream":[9,121],"NLP":[10],"tasks":[11],"by":[12,42,139],"leveraging":[13],"the":[14,49,58,97,114,127,132,159,185,190],"fine-grained":[15],"information":[16,77],"that":[17,147],"phrases":[18,73,101],"offer.":[19],"In":[20],"our":[21,63,86],"work,":[22],"we":[23,68,84],"propose":[24],"a":[25,66,120,140,144],"new":[26],"task":[27,118],"formulation":[28],"of":[29,51,71,100,129,166,184,197],"retrieval,":[31,35],"cross-lingual":[32,40,72,115],"contextualized":[33],"phrase":[34,116,133],"which":[36,95],"aims":[37],"to":[38,61,107,157],"augment":[39,158],"applications":[41],"addressing":[43],"polysemy":[44],"using":[45,74,92],"context":[46],"information.":[47],"However,":[48],"lack":[50],"specific":[52],"training":[53],"data":[54],"and":[55,105,119,168,176,212],"models":[56],"are":[57],"primary":[59],"challenges":[60],"achieve":[62],"goal.":[64],"As":[65],"result,":[67],"extract":[69],"pairs":[70],"word":[75],"alignment":[76],"automatically":[78],"induced":[79],"from":[80,174],"parallel":[81],"sentences.":[82],"Subsequently,":[83],"train":[85],"Cross-lingual":[87],"Contextualized":[88],"Phrase":[89],"Retriever":[90],"(CCPR)":[91],"contrastive":[93],"learning,":[94],"encourages":[96],"hidden":[98],"representations":[99],"with":[102],"similar":[103],"contexts":[104],"semantics":[106],"align":[108],"closely.":[109],"Comprehensive":[110],"experiments":[111],"on":[112,202],"both":[113],"task,":[122,135],"i.e,":[123],"machine":[124],"translation,":[125],"demonstrate":[126],"effectiveness":[128],"CCPR.":[130],"On":[131],"CCPR":[136,156],"surpasses":[137],"baselines":[138],"significant":[141],"margin,":[142],"achieving":[143],"top-1":[145],"accuracy":[146],"is":[148,182],"at":[149,198],"least":[150,199],"13":[151],"points":[152],"higher.":[153],"When":[154],"utilizing":[155],"large-language-model-based":[160],"translator,":[161],"it":[162],"achieves":[163,195],"average":[164],"gains":[165,196],"0.7":[167,200],"1.5":[169],"BERTScore":[171,201],"for":[172],"translations":[173,203],"X\u21a0En":[175],"vice":[177],"versa,":[178],"respectively,":[179],"where":[180],"X":[181],"one":[183],"six":[186],"Indo-European":[187],"languages":[188],"WMT16":[191],"dataset.":[192],"It":[193],"also":[194],"into":[204],"East":[205],"Asian":[206],"languages,":[207],"such":[208],"as":[209],"Japanese,":[210],"Chinese,":[211],"Korean.":[213]},"counts_by_year":[],"updated_date":"2026-03-11T06:11:40.159057","created_date":"2025-10-10T00:00:00"}
