{"id":"https://openalex.org/W7154352643","doi":"https://doi.org/10.48550/arxiv.2604.10345","title":"Fine-grained Multi-Document Extraction and Generation of Code Change Rationale","display_name":"Fine-grained Multi-Document Extraction and Generation of Code Change Rationale","publication_year":2026,"publication_date":"2026-04-11","ids":{"openalex":"https://openalex.org/W7154352643","doi":"https://doi.org/10.48550/arxiv.2604.10345"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.10345","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.10345","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.10345","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133580817","display_name":"Mehedi Sun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Mehedi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113377928","display_name":"Antu Saha","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Saha, Antu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046232249","display_name":"Nadeeshan De Silva","orcid":"https://orcid.org/0000-0001-5325-9030"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"De Silva, Nadeeshan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069505458","display_name":"Antonio Mastropaolo","orcid":"https://orcid.org/0000-0002-7965-7712"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mastropaolo, Antonio","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5003334072","display_name":"Oscar Chaparro","orcid":"https://orcid.org/0000-0003-2838-685X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chaparro, Oscar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9836000204086304,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9836000204086304,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.00430000014603138,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10639","display_name":"Advanced Software Engineering Methodologies","score":0.002899999963119626,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/commit","display_name":"Commit","score":0.8916000127792358},{"id":"https://openalex.org/keywords/code-refactoring","display_name":"Code refactoring","score":0.76910001039505},{"id":"https://openalex.org/keywords/program-comprehension","display_name":"Program comprehension","score":0.6877999901771545},{"id":"https://openalex.org/keywords/artifact","display_name":"Artifact (error)","score":0.6567000150680542},{"id":"https://openalex.org/keywords/java","display_name":"Java","score":0.5512999892234802},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4936999976634979},{"id":"https://openalex.org/keywords/software-maintenance","display_name":"Software maintenance","score":0.45249998569488525},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.3971000015735626},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.38359999656677246}],"concepts":[{"id":"https://openalex.org/C153180980","wikidata":"https://www.wikidata.org/wiki/Q19776675","display_name":"Commit","level":2,"score":0.8916000127792358},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8203999996185303},{"id":"https://openalex.org/C152752567","wikidata":"https://www.wikidata.org/wiki/Q116877","display_name":"Code refactoring","level":3,"score":0.76910001039505},{"id":"https://openalex.org/C2777561058","wikidata":"https://www.wikidata.org/wiki/Q2652119","display_name":"Program comprehension","level":4,"score":0.6877999901771545},{"id":"https://openalex.org/C2779010991","wikidata":"https://www.wikidata.org/wiki/Q2720909","display_name":"Artifact (error)","level":2,"score":0.6567000150680542},{"id":"https://openalex.org/C548217200","wikidata":"https://www.wikidata.org/wiki/Q251","display_name":"Java","level":2,"score":0.5512999892234802},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.5374000072479248},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4936999976634979},{"id":"https://openalex.org/C101317890","wikidata":"https://www.wikidata.org/wiki/Q940053","display_name":"Software maintenance","level":4,"score":0.45249998569488525},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.4352000057697296},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.3971000015735626},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.38359999656677246},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.3822999894618988},{"id":"https://openalex.org/C150292731","wikidata":"https://www.wikidata.org/wiki/Q1342704","display_name":"Code review","level":5,"score":0.375900000333786},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.36640000343322754},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.3619999885559082},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3555999994277954},{"id":"https://openalex.org/C511192102","wikidata":"https://www.wikidata.org/wiki/Q5156948","display_name":"Comprehension","level":2,"score":0.35109999775886536},{"id":"https://openalex.org/C137287247","wikidata":"https://www.wikidata.org/wiki/Q1329550","display_name":"Static program analysis","level":4,"score":0.34470000863075256},{"id":"https://openalex.org/C202105479","wikidata":"https://www.wikidata.org/wiki/Q265013","display_name":"Software evolution","level":5,"score":0.3345000147819519},{"id":"https://openalex.org/C529173508","wikidata":"https://www.wikidata.org/wiki/Q638608","display_name":"Software development","level":3,"score":0.3260999917984009},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.313400000333786},{"id":"https://openalex.org/C10272871","wikidata":"https://www.wikidata.org/wiki/Q929972","display_name":"Software inspection","level":5,"score":0.2935999929904938},{"id":"https://openalex.org/C160713754","wikidata":"https://www.wikidata.org/wiki/Q1389965","display_name":"Maintainability","level":2,"score":0.28439998626708984},{"id":"https://openalex.org/C51929080","wikidata":"https://www.wikidata.org/wiki/Q2425187","display_name":"Codebase","level":3,"score":0.2833999991416931},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.26969999074935913},{"id":"https://openalex.org/C133162039","wikidata":"https://www.wikidata.org/wiki/Q1061077","display_name":"Code generation","level":3,"score":0.26910001039505005},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.2653999924659729},{"id":"https://openalex.org/C166052673","wikidata":"https://www.wikidata.org/wiki/Q83021","display_name":"Empirical evidence","level":2,"score":0.26190000772476196},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.25679999589920044},{"id":"https://openalex.org/C68387754","wikidata":"https://www.wikidata.org/wiki/Q7271585","display_name":"Schedule","level":2,"score":0.2547999918460846},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2535000145435333},{"id":"https://openalex.org/C2777146004","wikidata":"https://www.wikidata.org/wiki/Q14949826","display_name":"CLARITY","level":2,"score":0.25200000405311584}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.10345","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.10345","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.10345","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.10345","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Understanding":[0],"the":[1,37,100,145,187,246,256],"reasons":[2],"behind":[3],"past":[4],"code":[5,178,238],"changes":[6],"is":[7,39,102],"critical":[8],"for":[9,34,147,206,234,248],"many":[10],"software":[11,266],"engineering":[12],"tasks,":[13],"including":[14],"refactoring":[15],"and":[16,21,27,44,55,91,107,115,123,150,165,171,180,190,203,232,241,254,264],"reviewing":[17],"code,":[18],"diagnosing":[19],"bugs,":[20],"implementing":[22],"new":[23],"features.":[24],"Unfortunately,":[25],"locating":[26],"reconstructing":[28],"this":[29,58,62],"rationale":[30,84,101,174,207,211,253],"can":[31],"be":[32],"difficult":[33],"developers":[35,222,262],"because":[36],"information":[38],"often":[40,119],"fragmented,":[41],"inconsistently":[42],"documented,":[43],"scattered":[45],"across":[46,95,167],"different":[47],"artifacts":[48,132,170],"such":[49,236],"as":[50,214,230,237],"commit":[51,105,135],"messages,":[52],"issue":[53],"reports,":[54],"PRs.":[56,124],"In":[57],"paper,":[59],"we":[60,68,153],"address":[61],"challenge":[63],"in":[64,121,131,251],"two":[65],"steps.":[66],"First,":[67],"conduct":[69],"an":[70,156],"empirical":[71],"study":[72,218],"of":[73,258],"63":[74,188],"commits":[75,189],"from":[76],"five":[77],"open-source":[78],"Java":[79,221],"projects":[80],"to":[81,176,260],"analyze":[82],"how":[83],"components":[85,126],"(e.g.,":[86],"a":[87,168],"change's":[88],"goal,":[89,163],"need,":[90,164],"alternative)":[92],"are":[93,117,127],"distributed":[94],"artifacts.":[96],"We":[97,183],"find":[98],"that":[99,159,225],"highly":[103],"fragmented:":[104],"messages":[106],"pull":[108],"requests":[109],"primarily":[110],"capture":[111],"goals,":[112],"while":[113,209],"needs":[114],"alternatives":[116],"more":[118],"found":[120,130],"issues":[122],"Other":[125],"scarce":[128],"but":[129],"other":[133],"than":[134],"messages.":[136],"No":[137],"single":[138],"artifact":[139],"type":[140],"captures":[141],"all":[142],"components,":[143],"underscoring":[144],"need":[146,247],"cross-document":[148],"reasoning":[149,250],"synthesis.":[151],"Second,":[152],"introduce":[154],"ARGUS,":[155],"LLM-based":[157],"approach":[158],"identifies":[160],"sentences":[161],"expressing":[162],"alternative":[166],"commit's":[169],"creates":[172],"concise":[173],"summaries":[175,212,227],"support":[177],"comprehension":[179],"maintenance":[181],"tasks.":[182],"evaluated":[184],"ARGUS":[185,259],"on":[186],"compared":[191],"its":[192],"performance":[193],"against":[194],"baseline":[195],"variants.":[196],"The":[197],"best-performing":[198],"version":[199],"achieved":[200],"51.4%":[201],"precision":[202],"93.2%":[204],"recall":[205],"identification,":[208],"producing":[210],"rated":[213],"accurate.":[215],"A":[216],"user":[217],"with":[219],"12":[220],"further":[223],"showed":[224],"these":[226],"were":[228],"perceived":[229],"useful":[231],"helpful":[233],"tasks":[235],"review,":[239],"documentation,":[240],"debugging.":[242],"Our":[243],"results":[244],"highlight":[245],"multi-document":[249],"capturing":[252],"demonstrate":[255],"potential":[257],"help":[261],"understand":[263],"maintain":[265],"systems.":[267]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-15T00:00:00"}
