{"id":"https://openalex.org/W7148450440","doi":"https://doi.org/10.48550/arxiv.2604.00275","title":"Structure- and Event-Driven Frameworks for State Machine Modeling with Large Language Models","display_name":"Structure- and Event-Driven Frameworks for State Machine Modeling with Large Language Models","publication_year":2026,"publication_date":"2026-03-31","ids":{"openalex":"https://openalex.org/W7148450440","doi":"https://doi.org/10.48550/arxiv.2604.00275"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.00275","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00275","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.00275","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132804173","display_name":"Samer Abdulkarim","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Abdulkarim, Samer","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132735008","display_name":"Evan Boyd","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Boyd, Evan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132795219","display_name":"Karl Bridi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bridi, Karl","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132829940","display_name":"Alec Tufenkjian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tufenkjian, Alec","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132798804","display_name":"Boqi Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Boqi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5132794886","display_name":"Gunter Mussbacher","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mussbacher, Gunter","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5132804173"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11450","display_name":"Model-Driven Software Engineering Techniques","score":0.18209999799728394,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11450","display_name":"Model-Driven Software Engineering Techniques","score":0.18209999799728394,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.15029999613761902,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.10239999741315842,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/finite-state-machine","display_name":"Finite-state machine","score":0.6672000288963318},{"id":"https://openalex.org/keywords/unified-modeling-language","display_name":"Unified Modeling Language","score":0.6352999806404114},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.6323000192642212},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5271000266075134},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.43790000677108765},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.43130001425743103},{"id":"https://openalex.org/keywords/modeling-language","display_name":"Modeling language","score":0.40950000286102295},{"id":"https://openalex.org/keywords/abstract-state-machines","display_name":"Abstract state machines","score":0.35749998688697815}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7293999791145325},{"id":"https://openalex.org/C167822520","wikidata":"https://www.wikidata.org/wiki/Q176452","display_name":"Finite-state machine","level":2,"score":0.6672000288963318},{"id":"https://openalex.org/C145644426","wikidata":"https://www.wikidata.org/wiki/Q169411","display_name":"Unified Modeling Language","level":3,"score":0.6352999806404114},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.6323000192642212},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5777999758720398},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5271000266075134},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.47679999470710754},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.43790000677108765},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.4316999912261963},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.43130001425743103},{"id":"https://openalex.org/C179603123","wikidata":"https://www.wikidata.org/wiki/Q1941921","display_name":"Modeling language","level":3,"score":0.40950000286102295},{"id":"https://openalex.org/C145243422","wikidata":"https://www.wikidata.org/wiki/Q333385","display_name":"Abstract state machines","level":3,"score":0.35749998688697815},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.3546999990940094},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.32179999351501465},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.32170000672340393},{"id":"https://openalex.org/C207953454","wikidata":"https://www.wikidata.org/wiki/Q2528011","display_name":"Virtual finite-state machine","level":3,"score":0.31049999594688416},{"id":"https://openalex.org/C16671368","wikidata":"https://www.wikidata.org/wiki/Q230885","display_name":"State diagram","level":3,"score":0.296099990606308},{"id":"https://openalex.org/C2776187449","wikidata":"https://www.wikidata.org/wiki/Q1513879","display_name":"Natural language generation","level":3,"score":0.29409998655319214},{"id":"https://openalex.org/C21285288","wikidata":"https://www.wikidata.org/wiki/Q2117885","display_name":"Systems Modeling Language","level":4,"score":0.2924000024795532},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.28110000491142273},{"id":"https://openalex.org/C88977235","wikidata":"https://www.wikidata.org/wiki/Q787114","display_name":"Abstract machine","level":2,"score":0.27799999713897705},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.27639999985694885},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.26080000400543213},{"id":"https://openalex.org/C181062253","wikidata":"https://www.wikidata.org/wiki/Q5421886","display_name":"Extended finite-state machine","level":3,"score":0.2529999911785126}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.00275","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00275","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.00275","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00275","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"UML":[0,54],"state":[1,12,55,110,137,160,175,265],"machine":[2,56,138,161,176,266],"design":[3],"is":[4,113,198],"a":[5,81,86,94,103,132,170,204,233,269],"critical":[6],"process":[7],"in":[8,135,147,274],"software":[9],"engineering.":[10],"Traditionally,":[11],"machines":[13],"are":[14,125,145],"manually":[15],"crafted":[16],"by":[17],"experienced":[18],"engineers":[19],"based":[20,127],"on":[21,128],"natural":[22],"language":[23],"requirements-a":[24],"time-consuming":[25],"and":[26,77,85,92,150,188,214,257],"error-prone":[27],"procedure.":[28],"Many":[29],"automated":[30,206,264],"approaches":[31],"exist":[32],"but":[33,243],"they":[34],"require":[35],"structured":[36],"NL":[37,66],"requirements.":[38,67],"In":[39,119],"this":[40,275],"paper,":[41],"we":[42],"investigate":[43],"the":[44,100,179,225,228,237,248,255,258],"capabilities":[45],"of":[46,72,184,210,227,260],"current":[47,261],"Large":[48],"Language":[49],"Models":[50],"to":[51,173,232],"fully":[52,201,205],"automate":[53],"generation":[57],"via":[58],"specialized":[59],"State":[60],"Machine":[61],"Frameworks":[62],"(SMFs)":[63],"from":[64,102,178],"non-structured":[65],"We":[68],"evaluate":[69],"two":[70,122],"types":[71],"state-of-the-art":[73],"LLMs":[74,168,262],"using":[75,192],"single-step":[76],"multi-step":[78],"prompting":[79],"approaches:":[80,130],"non-reasoning":[82,229],"LLM":[83,88,230,239],"GPT-4o":[84],"reasoning-focused":[87],"Claude":[89,193],"3.5":[90,194,241],"Sonnet,":[91],"introduce":[93],"novel":[95],"Hybrid":[96,222],"Approach":[97,223],"that":[98,166],"uses":[99],"output":[101],"Single-Prompt":[104,180],"Baseline":[105,181],"as":[106,236],"an":[107,117,152],"initial":[108],"draft":[109],"machine,":[111],"which":[112,136],"then":[114],"refined":[115],"through":[116],"SMF.":[118],"our":[120],"study,":[121],"distinct":[123],"SMFs":[124],"developed":[126],"human":[129],"(i)":[131],"Structure-Driven":[133],"SMF,":[134,154],"components":[139],"(states,":[140],"transitions,":[141],"guards,":[142],"actions,":[143],"etc.)":[144],"generated":[146],"sequential":[148],"steps,":[149],"(ii)":[151],"Event-Driven":[153],"where":[155],"identified":[156],"events":[157],"iteratively":[158],"guide":[159],"construction.":[162],"Our":[163,220,251],"experiments":[164],"indicate":[165],"while":[167],"demonstrate":[169],"promising":[171],"ability":[172],"generate":[174],"models":[177],"(e.g.,":[182,208],"F1-scores":[183,209],"0.90":[185],"for":[186,190,203,212,216,218,263,271],"states":[187],"0.75":[189],"transitions":[191],"Sonnet),":[195],"their":[196],"performance":[197,226],"not":[199,245],"yet":[200],"sufficient":[202],"solution":[207],"0.23":[211],"guards":[213],"0.00":[215],"actions":[217],"GPT-4o).":[219],"proposed":[221],"improves":[224],"(GPT-4o)":[231],"similar":[234],"level":[235],"reasoning":[238,249],"(Claude":[240],"Sonnet)":[242],"does":[244],"further":[246],"improve":[247],"LLM.":[250],"evaluation":[252],"highlights":[253],"both":[254],"potential":[256],"limitations":[259],"design,":[267],"providing":[268],"baseline":[270],"future":[272],"research":[273],"domain.":[276]},"counts_by_year":[],"updated_date":"2026-04-03T16:44:17.987007","created_date":"2026-04-03T00:00:00"}
