{"id":"https://openalex.org/W7119516093","doi":"https://doi.org/10.48550/arxiv.2601.03878","title":"Understanding Specification-Driven Code Generation with LLMs: An Empirical Study Design","display_name":"Understanding Specification-Driven Code Generation with LLMs: An Empirical Study Design","publication_year":2026,"publication_date":"2026-01-07","ids":{"openalex":"https://openalex.org/W7119516093","doi":"https://doi.org/10.48550/arxiv.2601.03878"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.03878","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.03878","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.03878","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5122309492","display_name":"Giovanni Rosa","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Rosa, Giovanni","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079148542","display_name":"David Moreno-Lumbreras","orcid":"https://orcid.org/0000-0002-5454-7808"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Moreno-Lumbreras, David","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Robles, Gregorio","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Robles, Gregorio","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5121085003","display_name":"Jesus M. Gonzalez-Barahona","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gonz\u00e1lez-Barahona, Jes\u00fas M.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5122309492"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.38440001010894775,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.38440001010894775,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10430","display_name":"Software Engineering Techniques and Practices","score":0.1080000028014183,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11450","display_name":"Model-Driven Software Engineering Techniques","score":0.09179999679327011,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/empirical-research","display_name":"Empirical research","score":0.6322000026702881},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.5773000121116638},{"id":"https://openalex.org/keywords/code-generation","display_name":"Code generation","score":0.5299999713897705},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5081999897956848},{"id":"https://openalex.org/keywords/test-driven-development","display_name":"Test-driven development","score":0.48739999532699585},{"id":"https://openalex.org/keywords/static-program-analysis","display_name":"Static program analysis","score":0.4480000138282776},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.41190001368522644},{"id":"https://openalex.org/keywords/software-development","display_name":"Software development","score":0.4047999978065491},{"id":"https://openalex.org/keywords/software-quality","display_name":"Software quality","score":0.38999998569488525},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.38749998807907104}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7533000111579895},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.6322000026702881},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.6205000281333923},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.5773000121116638},{"id":"https://openalex.org/C133162039","wikidata":"https://www.wikidata.org/wiki/Q1061077","display_name":"Code generation","level":3,"score":0.5299999713897705},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.5171999931335449},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5081999897956848},{"id":"https://openalex.org/C4478048","wikidata":"https://www.wikidata.org/wiki/Q950250","display_name":"Test-driven development","level":4,"score":0.48739999532699585},{"id":"https://openalex.org/C137287247","wikidata":"https://www.wikidata.org/wiki/Q1329550","display_name":"Static program analysis","level":4,"score":0.4480000138282776},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.41190001368522644},{"id":"https://openalex.org/C529173508","wikidata":"https://www.wikidata.org/wiki/Q638608","display_name":"Software development","level":3,"score":0.4047999978065491},{"id":"https://openalex.org/C117447612","wikidata":"https://www.wikidata.org/wiki/Q1412670","display_name":"Software quality","level":4,"score":0.38999998569488525},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.38749998807907104},{"id":"https://openalex.org/C150292731","wikidata":"https://www.wikidata.org/wiki/Q1342704","display_name":"Code review","level":5,"score":0.35429999232292175},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.334199994802475},{"id":"https://openalex.org/C52913732","wikidata":"https://www.wikidata.org/wiki/Q857102","display_name":"Software design","level":4,"score":0.33329999446868896},{"id":"https://openalex.org/C509989072","wikidata":"https://www.wikidata.org/wiki/Q15188241","display_name":"Model-driven architecture","level":4,"score":0.32600000500679016},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.3188000023365021},{"id":"https://openalex.org/C145644426","wikidata":"https://www.wikidata.org/wiki/Q169411","display_name":"Unified Modeling Language","level":3,"score":0.2913999855518341},{"id":"https://openalex.org/C2777466363","wikidata":"https://www.wikidata.org/wiki/Q17008971","display_name":"Design tool","level":2,"score":0.2856000065803528},{"id":"https://openalex.org/C53942775","wikidata":"https://www.wikidata.org/wiki/Q1211721","display_name":"Code coverage","level":3,"score":0.28110000491142273},{"id":"https://openalex.org/C2776542497","wikidata":"https://www.wikidata.org/wiki/Q5266672","display_name":"Development (topology)","level":2,"score":0.28110000491142273},{"id":"https://openalex.org/C128942645","wikidata":"https://www.wikidata.org/wiki/Q1568346","display_name":"Test case","level":3,"score":0.2782000005245209},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.27709999680519104},{"id":"https://openalex.org/C195672273","wikidata":"https://www.wikidata.org/wiki/Q6888132","display_name":"Model-based design","level":2,"score":0.27160000801086426},{"id":"https://openalex.org/C2778029271","wikidata":"https://www.wikidata.org/wiki/Q5421931","display_name":"Extension (predicate logic)","level":2,"score":0.26980000734329224},{"id":"https://openalex.org/C179603123","wikidata":"https://www.wikidata.org/wiki/Q1941921","display_name":"Modeling language","level":3,"score":0.2635999917984009},{"id":"https://openalex.org/C2780330621","wikidata":"https://www.wikidata.org/wiki/Q7936609","display_name":"Visual modeling","level":4,"score":0.26179999113082886},{"id":"https://openalex.org/C152752567","wikidata":"https://www.wikidata.org/wiki/Q116877","display_name":"Code refactoring","level":3,"score":0.25929999351501465},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.25440001487731934},{"id":"https://openalex.org/C116253237","wikidata":"https://www.wikidata.org/wiki/Q1437424","display_name":"Formal specification","level":2,"score":0.25279998779296875},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.25119999051094055}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.03878","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.03878","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.03878","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.03878","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.45886939764022827,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2],"(LLMs)":[3],"are":[4],"increasingly":[5],"integrated":[6],"into":[7,128],"software":[8],"development":[9,133],"workflows,":[10],"yet":[11],"their":[12],"behavior":[13],"in":[14,109],"structured,":[15],"specification-driven":[16],"processes":[17],"remains":[18],"poorly":[19],"understood.":[20],"This":[21],"paper":[22],"presents":[23],"an":[24],"empirical":[25,126],"study":[26,102],"design":[27,130],"using":[28],"CURRANTE,":[29],"a":[30,37],"Visual":[31],"Studio":[32],"Code":[33],"extension":[34],"that":[35,67,135],"enables":[36],"human-in-the-loop":[38],"workflow":[39],"for":[40],"LLM-assisted":[41],"code":[42,141],"generation.":[43,142],"The":[44,101,122],"tool":[45,82],"guides":[46],"developers":[47],"through":[48],"three":[49],"sequential":[50],"stages--Specification,":[51],"Tests,":[52],"and":[53,60,64,98,111,117],"Function--allowing":[54],"them":[55],"to":[56,104],"define":[57],"requirements,":[58],"generate":[59],"refine":[61],"test":[62,112],"suites,":[63],"produce":[65],"functions":[66],"satisfy":[68],"those":[69],"tests.":[70],"Participants":[71],"will":[72,124],"solve":[73],"medium-difficulty":[74],"problems":[75],"from":[76],"the":[77,81,115,129],"LiveCodeBench":[78],"dataset,":[79],"while":[80],"records":[83],"fine-grained":[84],"interaction":[85],"logs,":[86],"effectiveness":[87],"metrics":[88],"(e.g.,":[89,96],"pass":[90],"rate,":[91],"all-pass":[92],"completion),":[93],"efficiency":[94],"indicators":[95],"time-to-pass),":[97],"iteration":[99],"behaviors.":[100],"aims":[103],"analyze":[105],"how":[106],"human":[107,137],"intervention":[108],"specification":[110],"refinement":[113],"influences":[114],"quality":[116],"dynamics":[118],"of":[119,131],"LLM-generated":[120],"code.":[121],"results":[123],"provide":[125],"insights":[127],"next-generation":[132],"environments":[134],"align":[136],"reasoning":[138],"with":[139],"model-driven":[140]},"counts_by_year":[],"updated_date":"2026-03-25T23:56:10.502304","created_date":"2026-01-09T00:00:00"}
