{"id":"https://openalex.org/W7155555069","doi":"https://doi.org/10.48550/arxiv.2604.21584","title":"CoFEE: Reasoning Control for LLM-Based Feature Discovery","display_name":"CoFEE: Reasoning Control for LLM-Based Feature Discovery","publication_year":2026,"publication_date":"2026-04-23","ids":{"openalex":"https://openalex.org/W7155555069","doi":"https://doi.org/10.48550/arxiv.2604.21584"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.21584","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.21584","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.21584","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5116182526","display_name":"Maximilian Westermann","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Westermann, Maximilian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134526574","display_name":"Ben Griffin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Griffin, Ben","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134534473","display_name":"Aaron Ontoyin Yin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yin, Aaron Ontoyin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134563171","display_name":"Zakari Salifu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Salifu, Zakari","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134483749","display_name":"Yagiz Ihlamur","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ihlamur, Yagiz","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134510598","display_name":"Kelvin Amoaba","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Amoaba, Kelvin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134524509","display_name":"Joseph Ternasky","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ternasky, Joseph","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114658551","display_name":"Fuat Alican","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alican, Fuat","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5093557649","display_name":"Yigit Ihlamur","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ihlamur, Yigit","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.42239999771118164,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.42239999771118164,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.07050000131130219,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.05640000104904175,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6345999836921692},{"id":"https://openalex.org/keywords/backtracking","display_name":"Backtracking","score":0.4546999931335449},{"id":"https://openalex.org/keywords/cognition","display_name":"Cognition","score":0.4383000135421753},{"id":"https://openalex.org/keywords/observability","display_name":"Observability","score":0.4153999984264374},{"id":"https://openalex.org/keywords/chaining","display_name":"Chaining","score":0.4081999957561493},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4043999910354614},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.36090001463890076},{"id":"https://openalex.org/keywords/predictability","display_name":"Predictability","score":0.3578000068664551},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.353300005197525}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6636999845504761},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6345999836921692},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6057000160217285},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5507000088691711},{"id":"https://openalex.org/C156884757","wikidata":"https://www.wikidata.org/wiki/Q798554","display_name":"Backtracking","level":2,"score":0.4546999931335449},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.4383000135421753},{"id":"https://openalex.org/C36299963","wikidata":"https://www.wikidata.org/wiki/Q1369844","display_name":"Observability","level":2,"score":0.4153999984264374},{"id":"https://openalex.org/C49020025","wikidata":"https://www.wikidata.org/wiki/Q1059099","display_name":"Chaining","level":2,"score":0.4081999957561493},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4043999910354614},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.36090001463890076},{"id":"https://openalex.org/C197640229","wikidata":"https://www.wikidata.org/wiki/Q2534066","display_name":"Predictability","level":2,"score":0.3578000068664551},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.353300005197525},{"id":"https://openalex.org/C2778827112","wikidata":"https://www.wikidata.org/wiki/Q22245680","display_name":"Feature engineering","level":3,"score":0.3244999945163727},{"id":"https://openalex.org/C101814296","wikidata":"https://www.wikidata.org/wiki/Q5439685","display_name":"Feature model","level":3,"score":0.3192000091075897},{"id":"https://openalex.org/C89288958","wikidata":"https://www.wikidata.org/wiki/Q7301504","display_name":"Reasoning system","level":2,"score":0.3052999973297119},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.289900004863739},{"id":"https://openalex.org/C142614401","wikidata":"https://www.wikidata.org/wiki/Q777433","display_name":"Forward chaining","level":3,"score":0.289000004529953},{"id":"https://openalex.org/C83725634","wikidata":"https://www.wikidata.org/wiki/Q7268699","display_name":"Qualitative reasoning","level":2,"score":0.2854999899864197},{"id":"https://openalex.org/C37335422","wikidata":"https://www.wikidata.org/wiki/Q6888134","display_name":"Model-based reasoning","level":3,"score":0.2782999873161316},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.2680000066757202},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2590000033378601},{"id":"https://openalex.org/C183521366","wikidata":"https://www.wikidata.org/wiki/Q7256422","display_name":"Psychology of reasoning","level":4,"score":0.2574999928474426},{"id":"https://openalex.org/C115086926","wikidata":"https://www.wikidata.org/wiki/Q17004651","display_name":"Causal reasoning","level":3,"score":0.2547000050544739},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.2524999976158142}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.21584","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.21584","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.21584","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.21584","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.7203501462936401,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Feature":[0,94],"discovery":[1],"from":[2,150],"complex":[3],"unstructured":[4],"data":[5,228],"is":[6,198,242],"fundamentally":[7],"a":[8,19,41,97,114,168],"reasoning":[9,78,98,165,240],"problem:":[10],"it":[11],"requires":[12],"identifying":[13],"abstractions":[14],"that":[15,101,173,197],"are":[16,49],"predictive":[17],"of":[18,32,62,129,163,250],"target":[20],"outcome":[21],"while":[22,205],"avoiding":[23],"leakage,":[24],"proxies,":[25],"and":[26,146,157,160,210,248],"post-outcome":[27],"signals.":[28],"With":[29],"the":[30,107,127,134,202,227],"introduction":[31],"ever-improving":[33],"Large":[34],"Language":[35],"Models":[36],"(LLMs),":[37],"our":[38,237],"method":[39,43],"provides":[40],"structured":[42,123],"for":[44,52,86,230],"addressing":[45],"this":[46,53,74],"challenge.":[47],"LLMs":[48,81],"well":[50],"suited":[51],"task":[54],"by":[55,82,133,213],"being":[56],"able":[57],"to":[58,70],"process":[59],"large":[60],"amounts":[61],"information,":[63],"but":[64],"unconstrained":[65,186],"feature":[66,88,111,217,252],"generation":[67],"can":[68],"lead":[69],"weak":[71],"features.":[72],"In":[73,167],"work,":[75],"we":[76,171,219],"study":[77],"control":[79,99,241],"in":[80,105,143,236,246],"inducing":[83],"cognitive":[84,103,119,175],"behaviors":[85,104,120,137,176],"improving":[87],"discovery.":[89,112,231,253],"We":[90],"introduce":[91],"CoFEE":[92,190],"(Cognitive":[93],"Engineering":[95],"Engine),":[96],"framework":[100],"enforces":[102],"how":[106],"LLM":[108,188],"reasons":[109],"during":[110],"From":[113],"machine":[115],"learning":[116],"perspective,":[117],"these":[118],"act":[121],"as":[122],"inductive":[124],"biases":[125],"over":[126],"space":[128],"candidate":[130],"features":[131,178,209,224],"generated":[132],"model.":[135],"These":[136],"have":[138],"been":[139],"exploited":[140],"with":[141,179,244],"success":[142],"ML":[144],"models,":[145],"include":[147],"backward":[148],"chaining":[149],"outcomes,":[151],"subgoal":[152],"decomposition,":[153],"verification":[154],"against":[155],"observability":[156],"leakage":[158],"criteria,":[159],"explicit":[161],"backtracking":[162],"rejected":[164],"paths.":[166],"controlled":[169],"comparison,":[170],"show":[172],"enforcing":[174],"yields":[177],"higher":[180,200],"empirical":[181],"predictability":[182],"than":[183,201],"those":[184],"under":[185],"vanilla":[187,203],"prompts.":[189],"achieves":[191],"an":[192],"average":[193],"Success":[194],"Rate":[195],"Score":[196],"15.2%":[199],"approach,":[204],"generating":[206],"29%":[207],"fewer":[208],"reducing":[211],"costs":[212],"53.3%.":[214],"Using":[215],"held-out":[216],"evaluation,":[218],"assess":[220],"whether":[221],"cognitively":[222],"induced":[223],"generalize":[225],"beyond":[226],"used":[229],"Our":[232],"results":[233],"indicate":[234],"that,":[235],"evaluated":[238],"setting,":[239],"associated":[243],"improvements":[245],"quality":[247],"efficiency":[249],"LLM-based":[251]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-25T00:00:00"}
