{"id":"https://openalex.org/W7131383751","doi":"https://doi.org/10.48550/arxiv.2602.19407","title":"Multi-CoLoR: Context-Aware Localization and Reasoning across Multi-Language Codebases","display_name":"Multi-CoLoR: Context-Aware Localization and Reasoning across Multi-Language Codebases","publication_year":2026,"publication_date":"2026-02-23","ids":{"openalex":"https://openalex.org/W7131383751","doi":"https://doi.org/10.48550/arxiv.2602.19407"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2602.19407","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.19407","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2602.19407","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056499909","display_name":"Indira Vats","orcid":"https://orcid.org/0000-0002-8605-766X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Vats, Indira","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126686384","display_name":"Sanjukta De","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"De, Sanjukta","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126711710","display_name":"Subhayan Roy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Roy, Subhayan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034804814","display_name":"Saurabh Bodhe","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bodhe, Saurabh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126737333","display_name":"Lejin Varghese","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Varghese, Lejin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073041618","display_name":"Max Kiehn","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kiehn, Max","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5118792451","display_name":"Yonas Bedasso","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bedasso, Yonas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Chechik, Marsha","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chechik, Marsha","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5056499909"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9354000091552734,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9354000091552734,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.012400000356137753,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.007499999832361937,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/traverse","display_name":"Traverse","score":0.6053000092506409},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5997999906539917},{"id":"https://openalex.org/keywords/tree-traversal","display_name":"Tree traversal","score":0.5914999842643738},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5820000171661377},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5493000149726868},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.43070000410079956},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.41040000319480896}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8048999905586243},{"id":"https://openalex.org/C176809094","wikidata":"https://www.wikidata.org/wiki/Q15401496","display_name":"Traverse","level":2,"score":0.6053000092506409},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5997999906539917},{"id":"https://openalex.org/C140745168","wikidata":"https://www.wikidata.org/wiki/Q1210082","display_name":"Tree traversal","level":2,"score":0.5914999842643738},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5820000171661377},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5493000149726868},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46959999203681946},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.43070000410079956},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.41040000319480896},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.391400009393692},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.3894999921321869},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3880999982357025},{"id":"https://openalex.org/C2987255567","wikidata":"https://www.wikidata.org/wiki/Q33002955","display_name":"Knowledge graph","level":2,"score":0.3732999861240387},{"id":"https://openalex.org/C96333769","wikidata":"https://www.wikidata.org/wiki/Q907955","display_name":"Graph traversal","level":3,"score":0.37299999594688416},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.3547999858856201},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.3407999873161316},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.3361000120639801},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.31529998779296875},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3142000138759613},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.3075000047683716}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2602.19407","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.19407","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2602.19407","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.19407","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2],"demonstrate":[3],"strong":[4],"capabilities":[5],"in":[6,90],"code":[7,21,49,115],"generation":[8],"but":[9],"struggle":[10],"to":[11,16,83,107],"navigate":[12],"complex,":[13],"multi-language":[14],"repositories":[15],"locate":[17],"relevant":[18],"code.":[19],"Effective":[20],"localization":[22,126,152],"requires":[23],"understanding":[24],"both":[25,167],"organizational":[26,77],"context":[27,97],"(e.g.,":[28],"historical":[29,105],"issue-fix":[30],"patterns)":[31],"and":[32,70,102,112,133,150,154,169],"structural":[33,129],"relationships":[34],"within":[35,131],"heterogeneous":[36],"codebases.":[37,135],"Existing":[38],"methods":[39],"either":[40],"(i)":[41,93],"focus":[42],"narrowly":[43],"on":[44,137,176],"single-language":[45],"benchmarks,":[46],"(ii)":[47,113],"retrieve":[48],"across":[50,72],"languages":[51],"via":[52],"shallow":[53],"textual":[54],"similarity,":[55],"or":[56],"(iii)":[57],"assume":[58],"no":[59],"prior":[60],"context.":[61],"We":[62],"present":[63],"Multi-CoLoR,":[64],"a":[65,94,114,124,138],"framework":[66],"for":[67],"Context-aware":[68],"Localization":[69],"Reasoning":[71],"Multi-Language":[73],"codebases,":[74],"which":[75],"integrates":[76],"knowledge":[78],"retrieval":[79],"with":[80],"graph-based":[81,155,170],"reasoning":[82,130,156],"traverse":[84],"complex":[85],"software":[86],"ecosystems.":[87],"Multi-CoLoR":[88,163],"operates":[89],"two":[91],"stages:":[92],"similar":[95],"issue":[96],"(SIC)":[98],"module":[99],"retrieves":[100],"semantically":[101],"organizationally":[103],"related":[104],"issues":[106],"prune":[108],"the":[109,147],"search":[110,148],"space,":[111],"graph":[116],"traversal":[117],"agent":[118],"(an":[119],"extended":[120],"version":[121],"of":[122],"LocAgent,":[123],"state-of-the-art":[125],"framework)":[127],"performs":[128],"C++":[132],"QML":[134],"Evaluations":[136],"real-world":[139],"enterprise":[140],"dataset":[141],"show":[142],"that":[143],"incorporating":[144],"SIC":[145],"reduces":[146],"space":[149],"improves":[151,164],"accuracy,":[153],"generalizes":[157],"effectively":[158],"beyond":[159],"Python-only":[160],"repositories.":[161],"Combined,":[162],"Acc@5":[165],"over":[166],"lexical":[168],"baselines":[171],"while":[172],"reducing":[173],"tool":[174],"calls":[175],"an":[177],"AMD":[178],"codebase.":[179]},"counts_by_year":[],"updated_date":"2026-03-25T23:56:10.502304","created_date":"2026-02-26T00:00:00"}
