{"id":"https://openalex.org/W7130729681","doi":"https://doi.org/10.48550/arxiv.2602.17641","title":"FAMOSE: A ReAct Approach to Automated Feature Discovery","display_name":"FAMOSE: A ReAct Approach to Automated Feature Discovery","publication_year":2026,"publication_date":"2026-02-19","ids":{"openalex":"https://openalex.org/W7130729681","doi":"https://doi.org/10.48550/arxiv.2602.17641"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.17641","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009943357","display_name":"Keith Burghardt","orcid":"https://orcid.org/0000-0003-1164-9545"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Burghardt, Keith","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126521604","display_name":"Jienan Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Jienan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126458224","display_name":"Sadman Sakib","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sakib, Sadman","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126480578","display_name":"Yuning Hao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hao, Yuning","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5126481568","display_name":"Bo Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Bo","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5009943357"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.6955999732017517,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.6955999732017517,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.05530000105500221,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.04800000041723251,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.7508999705314636},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.7398999929428101},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.6765000224113464},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5758000016212463},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5620999932289124},{"id":"https://openalex.org/keywords/feature-engineering","display_name":"Feature engineering","score":0.525600016117096},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.3684999942779541}],"concepts":[{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.7508999705314636},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.7398999929428101},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7365000247955322},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.6765000224113464},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5997999906539917},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5758000016212463},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5620999932289124},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5378000140190125},{"id":"https://openalex.org/C2778827112","wikidata":"https://www.wikidata.org/wiki/Q22245680","display_name":"Feature engineering","level":3,"score":0.525600016117096},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.38929998874664307},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.3684999942779541},{"id":"https://openalex.org/C101814296","wikidata":"https://www.wikidata.org/wiki/Q5439685","display_name":"Feature model","level":3,"score":0.36410000920295715},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.3614000082015991},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.29649999737739563},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.2799000144004822},{"id":"https://openalex.org/C207685749","wikidata":"https://www.wikidata.org/wiki/Q2088941","display_name":"Domain knowledge","level":2,"score":0.26579999923706055},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.2551000118255615},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.25060001015663147}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.17641","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.17641","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.17641","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.17641","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure","score":0.46551570296287537}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Feature":[0],"engineering":[1],"remains":[2],"a":[3,43,177],"critical":[4],"yet":[5],"challenging":[6],"bottleneck":[7],"in":[8,200],"machine":[9],"learning,":[10],"particularly":[11],"for":[12,87,124],"tabular":[13],"data,":[14],"as":[15,209],"identifying":[16],"optimal":[17],"features":[18,57,167],"from":[19],"an":[20,66,78],"exponentially":[21],"large":[22],"feature":[23,60,84,161,210],"space":[24],"traditionally":[25],"demands":[26],"substantial":[27],"domain":[28],"expertise.":[29],"To":[30,69],"address":[31],"this":[32],"challenge,":[33],"we":[34],"introduce":[35],"FAMOSE":[36,72,97],"(Feature":[37],"AugMentation":[38],"and":[39,55,62,90,120,163,180],"Optimal":[40],"Selection":[41],"agEnt),":[42],"novel":[44],"framework":[45,81],"that":[46,96,145,194,203],"leverages":[47],"the":[48,74,102,122,153,182],"ReAct":[49,80,151],"paradigm":[50],"to":[51,82,138,157,176,184],"autonomously":[52],"explore,":[53],"generate,":[54],"refine":[56],"while":[58,134],"integrating":[59],"selection":[61],"evaluation":[63,164],"tools":[64],"within":[65],"agent":[67],"architecture.":[68],"our":[70],"knowledge,":[71],"represents":[73],"first":[75],"application":[76],"of":[77],"agentic":[79],"automated":[83],"engineering,":[85],"especially":[86],"both":[88],"regression":[89,125],"classification":[91,105],"tasks.":[92],"Extensive":[93],"experiments":[94],"demonstrate":[95],"is":[98,149,174],"at":[99],"or":[100,169],"near":[101],"state-of-the-art":[103,123],"on":[104,118,132],"tasks":[106,108,126],"(especially":[107],"with":[109],"more":[110,136,187],"than":[111,140],"10K":[112],"instances,":[113],"where":[114],"ROC-AUC":[115],"increases":[116],"0.23%":[117],"average),":[119],"achieves":[121],"by":[127,130],"reducing":[128],"RMSE":[129],"2.0%":[131],"average,":[133],"remaining":[135],"robust":[137],"errors":[139],"other":[141],"algorithms.":[142],"We":[143],"hypothesize":[144],"FAMOSE's":[146],"strong":[147],"performance":[148],"because":[150],"allows":[152],"LLM":[154,183],"context":[155],"window":[156],"record":[158],"(via":[159],"iterative":[160],"discovery":[162],"steps)":[165],"what":[166],"did":[168,170],"not":[171],"work.":[172],"This":[173],"similar":[175],"few-shot":[178],"prompt":[179],"guides":[181],"invent":[185],"better,":[186],"innovative":[188],"features.":[189],"Our":[190],"work":[191],"offers":[192],"evidence":[193],"AI":[195],"agents":[196],"are":[197],"remarkably":[198],"effective":[199],"solving":[201],"problems":[202],"require":[204],"highly":[205],"inventive":[206],"solutions,":[207],"such":[208],"engineering.":[211]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-21T00:00:00"}
