{"id":"https://openalex.org/W7133344426","doi":"https://doi.org/10.48550/arxiv.2603.00883","title":"Knowledge without Wisdom: Measuring Misalignment between LLMs and Intended Impact","display_name":"Knowledge without Wisdom: Measuring Misalignment between LLMs and Intended Impact","publication_year":2026,"publication_date":"2026-03-01","ids":{"openalex":"https://openalex.org/W7133344426","doi":"https://doi.org/10.48550/arxiv.2603.00883"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.00883","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00883","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.00883","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5127902874","display_name":"Michael Hardy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hardy, Michael","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5069435977","display_name":"Yunsung Kim","orcid":"https://orcid.org/0000-0002-2829-574X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Yunsung","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.21089999377727509,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.21089999377727509,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.1808999925851822,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.07249999791383743,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/downstream","display_name":"Downstream (manufacturing)","score":0.5875999927520752},{"id":"https://openalex.org/keywords/voting","display_name":"Voting","score":0.5688999891281128},{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.5648999810218811},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.4860000014305115},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4763000011444092},{"id":"https://openalex.org/keywords/knowledge-base","display_name":"Knowledge base","score":0.446399986743927},{"id":"https://openalex.org/keywords/variation","display_name":"Variation (astronomy)","score":0.4291999936103821}],"concepts":[{"id":"https://openalex.org/C2776207758","wikidata":"https://www.wikidata.org/wiki/Q5303302","display_name":"Downstream (manufacturing)","level":2,"score":0.5875999927520752},{"id":"https://openalex.org/C520049643","wikidata":"https://www.wikidata.org/wiki/Q189760","display_name":"Voting","level":3,"score":0.5688999891281128},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.5648999810218811},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4991999864578247},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.4860000014305115},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4763000011444092},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.446399986743927},{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.4291999936103821},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.40290001034736633},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.3905999958515167},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3874000012874603},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3495999872684479},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.3246000111103058},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.3237000107765198},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.322299987077713},{"id":"https://openalex.org/C42058472","wikidata":"https://www.wikidata.org/wiki/Q810214","display_name":"Base (topology)","level":2,"score":0.321399986743927},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3131999969482422},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.2858000099658966},{"id":"https://openalex.org/C90559484","wikidata":"https://www.wikidata.org/wiki/Q778379","display_name":"Expression (computer science)","level":2,"score":0.28459998965263367},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.2639000117778778},{"id":"https://openalex.org/C3020580240","wikidata":"https://www.wikidata.org/wiki/Q663272","display_name":"Expert opinion","level":2,"score":0.259799987077713},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.2535000145435333}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.00883","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00883","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.00883","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00883","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.8567756414413452,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"LLMs":[0,39,79,180],"increasingly":[1],"excel":[2],"on":[3,21,45,60,72],"AI":[4],"benchmarks,":[5,22],"but":[6],"doing":[7],"so":[8],"does":[9],"not":[10],"guarantee":[11],"validity":[12],"for":[13,132,154,165],"downstream":[14,23,84],"tasks.":[15,32,74,161],"This":[16],"study":[17],"contrasts":[18],"LLM":[19,125],"alignment":[20,168],"tasks,":[24],"and,":[25],"importantly":[26],"the":[27,35,49,94,157],"intended":[28,95],"impact":[29,96],"of":[30,37,48,53,86,97,124,134,156,169,179],"those":[31],"We":[33,120,162],"evaluate":[34],"performance":[36],"leading":[38],"(i.e.,":[40],"generative":[41],"pre-trained":[42],"base":[43],"models)":[44],"difficult-to-verify":[46],"tasks":[47,62,171],"teaching":[50,87],"and":[51,89,110,139,172],"learning":[52,99],"schoolchildren.":[54],"Across":[55],"all":[56,135],"LLMs,":[57,148],"inter-model":[58],"behaviors":[59,71],"disparate":[61],"correlate":[63],"higher":[64],"than":[65],"they":[66],"do":[67],"with":[68,83,93,118],"expert":[69],"human":[70],"target":[73],"These":[75],"biases":[76],"shared":[77,146],"across":[78,147],"are":[80],"poorly":[81],"aligned":[82,92],"measures":[85],"quality":[88],"often":[90],"negatively":[91],"student":[98],"outcomes.":[100],"Further,":[101],"we":[102],"find":[103],"multi-model":[104],"ensembles,":[105],"both":[106],"unanimous":[107],"model":[108],"voting":[109],"expert-weighting":[111],"by":[112],"benchmark":[113],"performance,":[114],"further":[115],"exacerbate":[116],"misalignment":[117,137,143,158],"learning.":[119],"measure":[121],"that":[122,140,150],"selection":[123],"and/or":[126],"prompting":[127],"strategy":[128],"only":[129],"reliably":[130],"accounts":[131,153],"$15\\%$":[133],"measured":[136],"error":[138,144],"variation":[141],"in":[142,159,181],"is":[145],"suggesting":[149],"common":[151],"pretraining":[152],"much":[155],"these":[160],"demonstrate":[163],"methods":[164],"robustly":[166],"measuring":[167],"complex":[170],"provide":[173],"unique":[174],"insights":[175],"into":[176],"practical":[177],"applications":[178],"high-noise":[182],"contexts.":[183]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-04T00:00:00"}
