{"id":"https://openalex.org/W7105985986","doi":"https://doi.org/10.48550/arxiv.2511.13040","title":"How Good is BLI as an Alignment Measure: A Study in Word Embedding Paradigm","display_name":"How Good is BLI as an Alignment Measure: A Study in Word Embedding Paradigm","publication_year":2025,"publication_date":"2025-11-17","ids":{"openalex":"https://openalex.org/W7105985986","doi":"https://doi.org/10.48550/arxiv.2511.13040"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2511.13040","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.13040","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2511.13040","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Wickramasinghe, Kasun","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wickramasinghe, Kasun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"de Silva, Nisansa","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"de Silva, Nisansa","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.3540000021457672,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.3540000021457672,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.1251000016927719,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12090","display_name":"Language and cultural evolution","score":0.08150000125169754,"subfield":{"id":"https://openalex.org/subfields/3316","display_name":"Cultural Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.7612000107765198},{"id":"https://openalex.org/keywords/degree","display_name":"Degree (music)","score":0.5357000231742859},{"id":"https://openalex.org/keywords/word-embedding","display_name":"Word embedding","score":0.5246999859809875},{"id":"https://openalex.org/keywords/lexicon","display_name":"Lexicon","score":0.48429998755455017},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.47200000286102295},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4657999873161316},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.4269999861717224},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.42489999532699585}],"concepts":[{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.7612000107765198},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7003999948501587},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5950000286102295},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5763000249862671},{"id":"https://openalex.org/C2775997480","wikidata":"https://www.wikidata.org/wiki/Q586277","display_name":"Degree (music)","level":2,"score":0.5357000231742859},{"id":"https://openalex.org/C2777462759","wikidata":"https://www.wikidata.org/wiki/Q18395344","display_name":"Word embedding","level":3,"score":0.5246999859809875},{"id":"https://openalex.org/C2778121359","wikidata":"https://www.wikidata.org/wiki/Q8096","display_name":"Lexicon","level":2,"score":0.48429998755455017},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.47200000286102295},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4657999873161316},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.4269999861717224},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.42489999532699585},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.3596000075340271},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.3319999873638153},{"id":"https://openalex.org/C177606310","wikidata":"https://www.wikidata.org/wiki/Q5674297","display_name":"Adaptability","level":2,"score":0.3228999972343445},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.30309998989105225},{"id":"https://openalex.org/C34388435","wikidata":"https://www.wikidata.org/wiki/Q2267362","display_name":"Bounded function","level":2,"score":0.301800012588501},{"id":"https://openalex.org/C2780035574","wikidata":"https://www.wikidata.org/wiki/Q30081","display_name":"Multilingualism","level":2,"score":0.30160000920295715},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.27880001068115234},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.25429999828338623},{"id":"https://openalex.org/C35435516","wikidata":"https://www.wikidata.org/wiki/Q5370016","display_name":"Embedding problem","level":3,"score":0.2506999969482422}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2511.13040","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.13040","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2511.13040","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.13040","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.5644962191581726,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Sans":[0],"a":[1,44,89,130,212,243],"dwindling":[2],"number":[3],"of":[4,33,54,80,100,108,112,127,136,138,164,178,186,199,230,255],"monolingual":[5,56,70],"embedding":[6,19,116,140,148,221,263,267],"studies":[7],"originating":[8],"predominantly":[9],"from":[10],"the":[11,22,31,37,51,64,76,92,101,110,123,134,162,176,179,184,196,227,235,253,256],"low-resource":[12,168,281],"domains,":[13],"it":[14],"is":[15,59,87,98,248],"evident":[16],"that":[17,191,223,247],"multilingual":[18,41,65,81,152,262,276],"has":[20],"become":[21],"de":[23],"facto":[24],"choice":[25],"due":[26],"to":[27,30,39,132,172,182,217,234],"its":[28],"adaptability":[29],"usage":[32],"code-mixed":[34],"languages,":[35],"granting":[36],"ability":[38],"process":[40],"documents":[42],"in":[43,72,106,161,201,251,273],"language-agnostic":[45],"manner,":[46],"as":[47,49,129,232],"well":[48,146],"removing":[50],"difficult":[52],"task":[53],"aligning":[55],"embeddings.":[57],"But":[58],"this":[60,119],"victory":[61],"complete?":[62],"Are":[63],"models":[66,71,82],"better":[67,271,279],"than":[68],"aligned":[69,220],"every":[73],"aspect?":[74],"Can":[75],"higher":[77],"computational":[78],"cost":[79],"always":[83],"be":[84],"justified?":[85],"Or":[86],"there":[88],"compromise":[90],"between":[91,114],"two":[93,115,139,219],"extremes?":[94],"Bilingual":[95],"Lexicon":[96],"Induction":[97],"one":[99],"most":[102],"widely":[103],"used":[104],"metrics":[105],"terms":[107],"evaluating":[109],"degree":[111,135,198,254],"alignment":[113,137,149,156,200,268],"spaces.":[117,141],"In":[118,170],"study,":[120],"we":[121,143,174,205,241],"explore":[122],"strengths":[124],"and":[125,154,167,204],"limitations":[126],"BLI":[128,159,192,215,238,260],"measure":[131,195],"evaluate":[133,144,218],"Further,":[142,240],"how":[145],"traditional":[147],"techniques,":[150],"novel":[151,213],"models,":[153],"combined":[155,266],"techniques":[157,269],"perform":[158,270,278],"tasks":[160],"contexts":[163],"both":[165],"high-resource":[166],"languages.":[169],"addition":[171],"that,":[173],"investigate":[175],"impact":[177],"language":[180,282],"families":[181],"which":[183],"pairs":[185],"languages":[187,231],"belong.":[188],"We":[189,210],"identify":[190],"does":[193],"not":[194],"true":[197],"some":[202],"cases":[203,275],"propose":[206,211],"solutions":[207],"for":[208],"them.":[209],"stem-based":[214],"approach":[216],"spaces":[222],"take":[224],"into":[225],"account":[226],"inflected":[228],"nature":[229],"opposed":[233],"prevalent":[236],"word-based":[237],"techniques.":[239],"introduce":[242],"vocabulary":[244],"pruning":[245],"technique":[246],"more":[249],"informative":[250],"showing":[252],"alignment,":[257],"especially":[258],"performing":[259],"on":[261],"models.":[264],"Often,":[265],"while":[272],"certain":[274],"embeddings":[277],"(mainly":[280],"cases).":[283]},"counts_by_year":[],"updated_date":"2025-11-19T23:39:43.309859","created_date":"2025-11-19T00:00:00"}
