{"id":"https://openalex.org/W4283371089","doi":"https://doi.org/10.48550/arxiv.2206.11212","title":"VisFIS: Visual Feature Importance Supervision with Right-for-the-Right-Reason Objectives","display_name":"VisFIS: Visual Feature Importance Supervision with Right-for-the-Right-Reason Objectives","publication_year":2022,"publication_date":"2022-06-22","ids":{"openalex":"https://openalex.org/W4283371089","doi":"https://doi.org/10.48550/arxiv.2206.11212"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2206.11212","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2206.11212","pdf_url":"https://arxiv.org/pdf/2206.11212","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2206.11212","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033138733","display_name":"Zhuofan Ying","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ying, Zhuofan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013096489","display_name":"Peter Hase","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hase, Peter","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5001987532","display_name":"Mohit Bansal","orcid":"https://orcid.org/0000-0001-5522-1351"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bansal, Mohit","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9884999990463257,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9830999970436096,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6732566952705383},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6224396228790283},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5555039644241333},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5532587170600891},{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.4663497805595398},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4127802550792694}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6732566952705383},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6224396228790283},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5555039644241333},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5532587170600891},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.4663497805595398},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4127802550792694},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2206.11212","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2206.11212","pdf_url":"https://arxiv.org/pdf/2206.11212","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2206.11212","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2206.11212","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2206.11212","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2206.11212","pdf_url":"https://arxiv.org/pdf/2206.11212","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.46000000834465027}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W2951187577","https://openalex.org/W3046775127","https://openalex.org/W3107602296","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W4364306694","https://openalex.org/W4312192474","https://openalex.org/W4283697347"],"abstract_inverted_index":{"Many":[0],"past":[1,161],"works":[2],"aim":[3],"to":[4,118],"improve":[5,77],"visual":[6],"reasoning":[7],"in":[8,120,152],"models":[9],"by":[10,15,90],"supervising":[11],"feature":[12,38],"importance":[13,39],"(estimated":[14],"model":[16,61,72,79,95,128,224,244],"explanation":[17,173,183],"techniques)":[18],"with":[19,50,63],"human":[20,64,132],"annotations":[21],"such":[22],"as":[23,81,83],"highlights":[24],"of":[25,116,154,222,239],"important":[26,111],"image":[27],"regions.":[28],"However,":[29],"recent":[30],"work":[31,162],"has":[32],"shown":[33],"that":[34,54,71,164,177],"performance":[35,84],"gains":[36],"from":[37],"(FI)":[40],"supervision":[41,74],"for":[42,92,167,228,242],"Visual":[43,140],"Question":[44],"Answering":[45],"(VQA)":[46],"tasks":[47],"persist":[48],"even":[49],"random":[51],"supervision,":[52],"suggesting":[53],"these":[55,240],"methods":[56],"do":[57],"not":[58,204,210,220],"meaningfully":[59,76],"align":[60],"FI":[62,73,129,133],"FI.":[65],"In":[66],"this":[67,178],"paper,":[68],"we":[69,175,213],"show":[70,176,214],"can":[75],"VQA":[78,150],"accuracy":[80,169,225],"well":[82],"on":[85,148,182],"several":[86],"Right-for-the-Right-Reason":[87],"(RRR)":[88],"metrics":[89,218,241],"optimizing":[91],"four":[93],"key":[94],"objectives:":[96],"(1)":[97],"accurate":[98,196],"predictions":[99,108,117],"given":[100,109],"limited":[101],"but":[102,209],"sufficient":[103],"information":[104,112],"(Sufficiency);":[105],"(2)":[106],"max-entropy":[107],"no":[110],"(Uncertainty);":[113],"(3)":[114],"invariance":[115],"changes":[119],"unimportant":[121],"features":[122],"(Invariance);":[123],"and":[124,131,157,201,203],"(4)":[125],"alignment":[126],"between":[127],"explanations":[130,134,186,198],"(Plausibility).":[135],"Our":[136],"best":[137],"performing":[138],"method,":[139],"Feature":[141],"Importance":[142],"Supervision":[143],"(VisFIS),":[144],"outperforms":[145],"strong":[146],"baselines":[147],"benchmark":[149],"datasets":[151],"terms":[153],"both":[155],"in-distribution":[156,231],"out-of-distribution":[158,223],"accuracy.":[159],"While":[160],"suggests":[163],"the":[165,189,237],"mechanism":[166],"improved":[168,172],"is":[170,249],"through":[171],"plausibility,":[174],"relationship":[179],"depends":[180],"crucially":[181],"faithfulness":[184],"(whether":[185],"truly":[187],"represent":[188],"model's":[190,230],"internal":[191],"reasoning).":[192],"Predictions":[193],"are":[194,199,207,219],"more":[195],"when":[197,205,226],"plausible":[200,208],"faithful,":[202],"they":[206],"faithful.":[211],"Lastly,":[212],"that,":[215],"surprisingly,":[216],"RRR":[217],"predictive":[221],"controlling":[227],"a":[229],"accuracy,":[232],"which":[233],"calls":[234],"into":[235],"question":[236],"value":[238],"evaluating":[243],"reasoning.":[245],"All":[246],"supporting":[247],"code":[248],"available":[250],"at":[251],"https://github.com/zfying/visfis":[252]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":3}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
