{"id":"https://openalex.org/W7157221460","doi":"https://doi.org/10.48550/arxiv.2604.24700","title":"Green Shielding: A User-Centric Approach Towards Trustworthy AI","display_name":"Green Shielding: A User-Centric Approach Towards Trustworthy AI","publication_year":2026,"publication_date":"2026-04-27","ids":{"openalex":"https://openalex.org/W7157221460","doi":"https://doi.org/10.48550/arxiv.2604.24700"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.24700","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.24700","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.24700","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134802158","display_name":"Aaron J. Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Li, Aaron J.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134755473","display_name":"Nicolas Sanchez","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sanchez, Nicolas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134769479","display_name":"Hao Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Hao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134819956","display_name":"Ruijiang Dong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dong, Ruijiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048683908","display_name":"Jaskaran Bains","orcid":"https://orcid.org/0000-0001-7880-5878"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bains, Jaskaran","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040153546","display_name":"Katrin Jaradeh","orcid":"https://orcid.org/0000-0002-0357-5892"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jaradeh, Katrin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134756409","display_name":"Zhen Xiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiang, Zhen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134777253","display_name":"Bo Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Bo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134770396","display_name":"Feng Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Feng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088336297","display_name":"Aaron E. Kornblith","orcid":"https://orcid.org/0000-0002-1344-575X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kornblith, Aaron","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134780253","display_name":"Bin Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Bin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5134802158"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.6033999919891357,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.6033999919891357,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.14319999516010284,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.04619999974966049,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/variation","display_name":"Variation (astronomy)","score":0.6876999735832214},{"id":"https://openalex.org/keywords/operationalization","display_name":"Operationalization","score":0.6622999906539917},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.574400007724762},{"id":"https://openalex.org/keywords/safer","display_name":"SAFER","score":0.5378999710083008},{"id":"https://openalex.org/keywords/trustworthiness","display_name":"Trustworthiness","score":0.49959999322891235},{"id":"https://openalex.org/keywords/trace","display_name":"TRACE (psycholinguistics)","score":0.4659999907016754},{"id":"https://openalex.org/keywords/soundness","display_name":"Soundness","score":0.4207000136375427}],"concepts":[{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.6876999735832214},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6791999936103821},{"id":"https://openalex.org/C9354725","wikidata":"https://www.wikidata.org/wiki/Q286017","display_name":"Operationalization","level":2,"score":0.6622999906539917},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.574400007724762},{"id":"https://openalex.org/C2776654903","wikidata":"https://www.wikidata.org/wiki/Q2601463","display_name":"SAFER","level":2,"score":0.5378999710083008},{"id":"https://openalex.org/C153701036","wikidata":"https://www.wikidata.org/wiki/Q659974","display_name":"Trustworthiness","level":2,"score":0.49959999322891235},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.48590001463890076},{"id":"https://openalex.org/C75291252","wikidata":"https://www.wikidata.org/wiki/Q1315756","display_name":"TRACE (psycholinguistics)","level":2,"score":0.4659999907016754},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4348999857902527},{"id":"https://openalex.org/C39920170","wikidata":"https://www.wikidata.org/wiki/Q693083","display_name":"Soundness","level":2,"score":0.4207000136375427},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.40959998965263367},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3580999970436096},{"id":"https://openalex.org/C2776493592","wikidata":"https://www.wikidata.org/wiki/Q5158717","display_name":"Succinctness","level":2,"score":0.3199999928474426},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.30149999260902405},{"id":"https://openalex.org/C93226319","wikidata":"https://www.wikidata.org/wiki/Q193137","display_name":"Differential (mechanical device)","level":2,"score":0.2939999997615814},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.2800999879837036},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.27639999985694885},{"id":"https://openalex.org/C162376815","wikidata":"https://www.wikidata.org/wiki/Q2158281","display_name":"Frequentist inference","level":4,"score":0.273499995470047},{"id":"https://openalex.org/C100521375","wikidata":"https://www.wikidata.org/wiki/Q2015382","display_name":"Competence (human resources)","level":2,"score":0.2732999920845032},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.2632000148296356},{"id":"https://openalex.org/C2776224158","wikidata":"https://www.wikidata.org/wiki/Q187931","display_name":"Phrase","level":2,"score":0.26030001044273376},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.2533999979496002},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2524999976158142}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.24700","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.24700","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.24700","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.24700","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.6508105397224426,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2],"(LLMs)":[3],"are":[4],"increasingly":[5],"deployed,":[6],"yet":[7],"their":[8],"outputs":[9,200],"can":[10,193],"be":[11],"highly":[12,181],"sensitive":[13],"to":[14,221],"routine,":[15],"non-adversarial":[16],"variation":[17,49,134],"in":[18,79,99,208,214],"how":[19,46],"users":[20],"phrase":[21],"queries,":[22,109],"a":[23,36,105],"gap":[24],"not":[25],"well":[26],"addressed":[27],"by":[28,44,86],"existing":[29],"red-teaming":[30],"efforts.":[31],"We":[32,53,125],"propose":[33],"Green":[34,97],"Shielding,":[35],"user-centric":[37],"agenda":[38,56,218],"for":[39,120,205],"building":[40],"evidence-backed":[41],"deployment":[42,207],"guidance":[43,204],"characterizing":[45],"benign":[47],"input":[48,133],"shifts":[50,152],"model":[51,83,141,199],"behavior.":[52,84],"operationalize":[54],"this":[55],"through":[57,102],"the":[58,80,87,217],"CUE":[59],"criteria:":[60],"benchmarks":[61],"with":[62,92,111],"authentic":[63],"Context,":[64],"reference":[65,113],"standards":[66],"and":[67,73,90,116,135,171,183,201,225],"metrics":[68,119],"that":[69,75,130,137,190],"capture":[70,131],"true":[71],"Utility,":[72],"perturbations":[74],"reflect":[76],"realistic":[77],"variations":[78],"Elicitation":[81],"of":[82,107,180,198],"Guided":[85],"PCS":[88],"framework":[89],"developed":[91],"practicing":[93],"physicians,":[94],"we":[95],"instantiate":[96],"Shielding":[98],"medical":[100,215],"diagnosis":[101,114,123],"HealthCareMagic-Diagnosis":[103],"(HCM-Dx),":[104],"benchmark":[106],"patient-authored":[108],"together":[110],"structured":[112],"sets":[115],"clinically":[117,144],"grounded":[118],"evaluating":[121],"differential":[122],"lists.":[124],"also":[126],"study":[127],"perturbation":[128],"regimes":[129],"routine":[132],"show":[136,189],"prompt-level":[138],"factors":[139,164],"shift":[140,195],"behavior":[142],"along":[143],"meaningful":[145],"dimensions.":[146],"Across":[147],"multiple":[148],"frontier":[149],"LLMs,":[150],"these":[151,187],"trace":[153],"out":[154],"Pareto-like":[155],"tradeoffs.":[156],"In":[157],"particular,":[158],"neutralization,":[159],"which":[160],"removes":[161],"common":[162],"user-level":[163],"while":[165],"preserving":[166],"clinical":[167],"content,":[168],"increases":[169],"plausibility":[170],"yields":[172],"more":[173],"concise,":[174],"clinician-like":[175],"differentials,":[176],"but":[177],"reduces":[178],"coverage":[179],"likely":[182],"safety-critical":[184],"conditions.":[185],"Together,":[186],"results":[188],"interaction":[191],"choices":[192],"systematically":[194],"task-relevant":[196],"properties":[197],"support":[202],"user-facing":[203],"safer":[206],"high-stakes":[209],"domains.":[210],"Although":[211],"instantiated":[212],"here":[213],"diagnosis,":[216],"extends":[219],"naturally":[220],"other":[222],"decision-support":[223],"settings":[224],"agentic":[226],"AI":[227],"systems.":[228]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-04-29T00:00:00"}
