{"id":"https://openalex.org/W7119085441","doi":"https://doi.org/10.48550/arxiv.2601.02060","title":"Perish or Flourish? A Holistic Evaluation of Large Language Models for Code Generation in Functional Programming","display_name":"Perish or Flourish? A Holistic Evaluation of Large Language Models for Code Generation in Functional Programming","publication_year":2026,"publication_date":"2026-01-05","ids":{"openalex":"https://openalex.org/W7119085441","doi":"https://doi.org/10.48550/arxiv.2601.02060"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.02060","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.02060","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.02060","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048243105","display_name":"Nico Lang","orcid":"https://orcid.org/0000-0001-8434-027X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Lang, Nguyet-Anh H.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050525060","display_name":"Evan Lang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lang, Eric","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013306670","display_name":"Thanh Le-Cong","orcid":"https://orcid.org/0000-0002-9566-324X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Le-Cong, Thanh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122235975","display_name":"Bach Le","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Le, Bach","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5057073070","display_name":"Quyet\u2010Thang Huynh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huynh, Quyet-Thang","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5048243105"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.5568000078201294,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.5568000078201294,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.0731000006198883,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10126","display_name":"Logic, programming, and type systems","score":0.054999999701976776,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/functional-programming","display_name":"Functional programming","score":0.6549999713897705},{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.6312000155448914},{"id":"https://openalex.org/keywords/programming-paradigm","display_name":"Programming paradigm","score":0.4787999987602234},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4284000098705292},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.41100001335144043},{"id":"https://openalex.org/keywords/code-generation","display_name":"Code generation","score":0.3901999890804291},{"id":"https://openalex.org/keywords/functional-equivalence","display_name":"Functional equivalence","score":0.3181999921798706},{"id":"https://openalex.org/keywords/program-analysis","display_name":"Program analysis","score":0.3181000053882599}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8039000034332275},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.7699999809265137},{"id":"https://openalex.org/C42383842","wikidata":"https://www.wikidata.org/wiki/Q193076","display_name":"Functional programming","level":2,"score":0.6549999713897705},{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.6312000155448914},{"id":"https://openalex.org/C34165917","wikidata":"https://www.wikidata.org/wiki/Q188267","display_name":"Programming paradigm","level":2,"score":0.4787999987602234},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4284000098705292},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.41290000081062317},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.41100001335144043},{"id":"https://openalex.org/C133162039","wikidata":"https://www.wikidata.org/wiki/Q1061077","display_name":"Code generation","level":3,"score":0.3901999890804291},{"id":"https://openalex.org/C2988012377","wikidata":"https://www.wikidata.org/wiki/Q29966452","display_name":"Functional equivalence","level":2,"score":0.3181999921798706},{"id":"https://openalex.org/C98183937","wikidata":"https://www.wikidata.org/wiki/Q2112188","display_name":"Program analysis","level":2,"score":0.3181000053882599},{"id":"https://openalex.org/C60051680","wikidata":"https://www.wikidata.org/wiki/Q30267","display_name":"Aspect-oriented programming","level":3,"score":0.31299999356269836},{"id":"https://openalex.org/C2777131603","wikidata":"https://www.wikidata.org/wiki/Q5508796","display_name":"Functional approach","level":2,"score":0.3077999949455261},{"id":"https://openalex.org/C2776245389","wikidata":"https://www.wikidata.org/wiki/Q962139","display_name":"Programming style","level":2,"score":0.3041999936103821},{"id":"https://openalex.org/C117447612","wikidata":"https://www.wikidata.org/wiki/Q1412670","display_name":"Software quality","level":4,"score":0.2904999852180481},{"id":"https://openalex.org/C548217200","wikidata":"https://www.wikidata.org/wiki/Q251","display_name":"Java","level":2,"score":0.2856999933719635},{"id":"https://openalex.org/C168065819","wikidata":"https://www.wikidata.org/wiki/Q845566","display_name":"Debugging","level":2,"score":0.2623000144958496},{"id":"https://openalex.org/C97686452","wikidata":"https://www.wikidata.org/wiki/Q7604153","display_name":"Static analysis","level":2,"score":0.26179999113082886},{"id":"https://openalex.org/C529173508","wikidata":"https://www.wikidata.org/wiki/Q638608","display_name":"Software development","level":3,"score":0.2554999887943268},{"id":"https://openalex.org/C199305712","wikidata":"https://www.wikidata.org/wiki/Q3205914","display_name":"Fifth-generation programming language","level":3,"score":0.2547999918460846},{"id":"https://openalex.org/C2777617010","wikidata":"https://www.wikidata.org/wiki/Q18957","display_name":"Mainstream","level":2,"score":0.2529999911785126},{"id":"https://openalex.org/C11164408","wikidata":"https://www.wikidata.org/wiki/Q18657800","display_name":"Second-generation programming language","level":4,"score":0.25049999356269836}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.02060","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.02060","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.02060","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.02060","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure","score":0.5976970791816711}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Functional":[0],"programming":[1,50,57,81,140,156],"provides":[2,97],"strong":[3],"foundations":[4],"for":[5,31,135,224],"developing":[6],"reliable":[7],"and":[8,52,94,109,118,121,133,142,173,199,212,221],"secure":[9],"software":[10],"systems,":[11],"yet":[12],"its":[13],"adoption":[14],"remains":[15],"not":[16],"widespread":[17],"due":[18],"to":[19,37,113],"the":[20],"steep":[21],"learning":[22],"curve.":[23],"Recent":[24],"advances":[25],"in":[26,55,138,154,168,176],"Large":[27],"Language":[28],"Models":[29],"(LLMs)":[30],"code":[32,119,136,189,197],"generation":[33,137],"present":[34],"new":[35,77],"opportunities":[36],"lower":[38],"these":[39],"barriers.":[40],"However,":[41],"extensive":[42],"evaluations":[43],"of":[44,79,227],"LLMs":[45,184,206],"largely":[46],"focus":[47],"on":[48,74,87],"imperative":[49,146,180,192],"languages,":[51],"their":[53],"capabilities":[54],"functional":[56,116,139,155,170,188],"languages":[58,141,171],"(FP)":[59],"remain":[60,165],"underexplored.":[61],"To":[62],"address":[63],"this":[64,124],"gap,":[65],"we":[66,126,203],"introduce":[67],"FPEval,":[68],"a":[69,76],"holistic":[70],"evaluation":[71,99],"framework":[72],"built":[73],"FPBench,":[75],"benchmark":[78],"721":[80],"tasks":[82],"across":[83],"three":[84,88],"difficulty":[85],"levels":[86],"mainstream":[89],"FP":[90],"languages:":[91],"Haskell,":[92],"Ocaml":[93],"Scala.":[95],"FPEval":[96],"compehensive":[98],"infrastructures":[100],"with":[101,105,159,217],"both":[102,115,210],"test":[103,107],"validations":[104],"comprehensive":[106],"suites":[108],"static":[110,218],"analysis":[111,219],"tools":[112],"assess":[114],"correctness":[117,211],"style":[120,198],"maintainability.":[122,201],"Using":[123],"framework,":[125],"evaluate":[127],"state-of-the-art":[128],"LLMs,":[129],"including":[130],"GPT-3.5,":[131],"GPT-4o,":[132],"GPT-5,":[134],"Java":[143],"as":[144],"an":[145],"baseline.":[147],"Our":[148],"results":[149],"demonstrate":[150],"that":[151,190,205],"LLM":[152],"performance":[153],"improves":[157],"substantially":[158],"model":[160],"advancement;":[161],"however,":[162],"error":[163],"rates":[164],"significantly":[166],"higher":[167],"purely":[169],"(Haskell":[172],"OCaml)":[174],"than":[175],"hybrid":[177],"(Scala)":[178],"or":[179],"(Java)":[181],"languages.":[182],"Moreover,":[183],"frequently":[185],"generate":[186],"non-idiomatic":[187],"follows":[191],"patterns,":[193],"raising":[194],"concerns":[195],"about":[196],"long-term":[200],"Finally,":[202],"show":[204],"can":[207],"partially":[208],"self-repair":[209],"quality":[213],"issues":[214],"when":[215],"provided":[216],"feedback":[220],"hand-crafted":[222],"instructions":[223],"common":[225],"types":[226],"issues.":[228]},"counts_by_year":[],"updated_date":"2026-01-08T20:10:11.968330","created_date":"2026-01-08T00:00:00"}
