{"id":"https://openalex.org/W7083476839","doi":"https://doi.org/10.48550/arxiv.2509.20901","title":"CafGa: Customizing Feature Attributions to Explain Language Models","display_name":"CafGa: Customizing Feature Attributions to Explain Language Models","publication_year":2025,"publication_date":"2025-09-25","ids":{"openalex":"https://openalex.org/W7083476839","doi":"https://doi.org/10.48550/arxiv.2509.20901"},"language":"en","primary_location":{"id":"doi:10.48550/arxiv.2509.20901","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2509.20901","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2509.20901","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Boyle, Alan","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Boyle, Alan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Cheng, Furui","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cheng, Furui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Zouhar, Vil\u00e9m","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zouhar, Vil\u00e9m","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"El-Assady, Mennatallah","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"El-Assady, Mennatallah","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T13102","display_name":"Soil and Environmental Studies","score":0.09390000253915787,"subfield":{"id":"https://openalex.org/subfields/1111","display_name":"Soil Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T13102","display_name":"Soil and Environmental Studies","score":0.09390000253915787,"subfield":{"id":"https://openalex.org/subfields/1111","display_name":"Soil Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.08739999681711197,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12713","display_name":"Forest Ecology and Biodiversity Studies","score":0.06920000165700912,"subfield":{"id":"https://openalex.org/subfields/1109","display_name":"Insect Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/attribution","display_name":"Attribution","score":0.7401000261306763},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.7077999711036682},{"id":"https://openalex.org/keywords/feature-model","display_name":"Feature model","score":0.46700000762939453},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.39430001378059387},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.3903999924659729},{"id":"https://openalex.org/keywords/computational-linguistics","display_name":"Computational linguistics","score":0.3628000020980835},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.3587000072002411}],"concepts":[{"id":"https://openalex.org/C143299363","wikidata":"https://www.wikidata.org/wiki/Q900584","display_name":"Attribution","level":2,"score":0.7401000261306763},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7105000019073486},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.7077999711036682},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5957000255584717},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5945000052452087},{"id":"https://openalex.org/C101814296","wikidata":"https://www.wikidata.org/wiki/Q5439685","display_name":"Feature model","level":3,"score":0.46700000762939453},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.39430001378059387},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3903999924659729},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3682999908924103},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.3628000020980835},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.3587000072002411},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.3310999870300293},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.31130000948905945},{"id":"https://openalex.org/C3020202489","wikidata":"https://www.wikidata.org/wiki/Q2032038","display_name":"Authorship attribution","level":2,"score":0.29820001125335693},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.2879999876022339},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.26980000734329224},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2678999900817871},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.26510000228881836},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2508000135421753}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2509.20901","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2509.20901","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2509.20901","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2509.20901","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.420163094997406,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Feature":[0],"attribution":[1,39,80],"methods,":[2,40],"such":[3],"as":[4,45,126],"SHAP":[5],"and":[6,56,77,92,96,140],"LIME,":[7],"explain":[8,26],"machine":[9],"learning":[10],"model":[11],"predictions":[12],"by":[13,133],"quantifying":[14],"the":[15,34,94,143,146],"influence":[16],"of":[17,108,145],"each":[18],"input":[19],"component.":[20],"When":[21],"applying":[22],"feature":[23,38,79],"attributions":[24],"to":[25,58,130],"language":[27],"models,":[28],"a":[29,103],"basic":[30],"question":[31],"is":[32,49],"defining":[33],"interpretable":[35],"components.":[36],"Traditional":[37],"commonly":[41],"treat":[42],"individual":[43],"words":[44],"atomic":[46],"units.":[47],"This":[48],"highly":[50],"computationally":[51],"inefficient":[52],"for":[53,75,99],"long-form":[54],"text":[55],"fails":[57],"capture":[59],"semantic":[60],"information":[61],"that":[62],"spans":[63],"multiple":[64],"words.":[65],"To":[66],"address":[67],"this,":[68],"we":[69,111],"present":[70],"CafGa,":[71],"an":[72],"interactive":[73],"tool":[74],"generating":[76],"evaluating":[78],"explanations":[81],"at":[82],"customizable":[83],"granularities.":[84],"CafGa":[85,122],"supports":[86],"customized":[87],"segmentation":[88],"with":[89],"user":[90,104],"interaction":[91],"visualizes":[93],"deletion":[95],"insertion":[97],"curves":[98],"explanation":[100],"assessments.":[101],"Through":[102],"study":[105],"involving":[106],"participants":[107],"various":[109],"expertise,":[110],"confirm":[112],"CafGa's":[113],"usefulness,":[114],"particularly":[115],"among":[116],"LLM":[117],"practitioners.":[118],"Explanations":[119],"created":[120],"using":[121],"were":[123],"also":[124],"perceived":[125],"more":[127],"useful":[128],"compared":[129],"those":[131],"generated":[132],"two":[134],"fully":[135],"automatic":[136],"baseline":[137],"methods:":[138],"PartitionSHAP":[139],"MExGen,":[141],"suggesting":[142],"effectiveness":[144],"system.":[147]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
