{"id":"https://openalex.org/W4412986206","doi":"https://doi.org/10.22152/programming-journal.org/2025/10/16","title":"Generating Inputs for Grammar Mining using Dynamic Symbolic Execution","display_name":"Generating Inputs for Grammar Mining using Dynamic Symbolic Execution","publication_year":2025,"publication_date":"2025-06-15","ids":{"openalex":"https://openalex.org/W4412986206","doi":"https://doi.org/10.22152/programming-journal.org/2025/10/16"},"language":"en","primary_location":{"id":"doi:10.22152/programming-journal.org/2025/10/16","is_oa":false,"landing_page_url":"https://doi.org/10.22152/programming-journal.org/2025/10/16","pdf_url":null,"source":{"id":"https://openalex.org/S4210199781","display_name":"The Art Science and Engineering of Programming","issn_l":"2473-7321","issn":["2473-7321"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Art, Science, and Engineering of Programming","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2508.03832","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064162245","display_name":"Andreas Pointner","orcid":"https://orcid.org/0000-0001-8642-1161"},"institutions":[{"id":"https://openalex.org/I4210136249","display_name":"University of Applied Sciences Upper Austria","ror":"https://ror.org/03jqp6d56","country_code":"AT","type":"education","lineage":["https://openalex.org/I4210136249"]}],"countries":["AT"],"is_corresponding":true,"raw_author_name":"Andreas Pointner","raw_affiliation_strings":["University of Applied Sciences Upper Austria, Austria"],"affiliations":[{"raw_affiliation_string":"University of Applied Sciences Upper Austria, Austria","institution_ids":["https://openalex.org/I4210136249"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103053531","display_name":"Josef Pichler","orcid":"https://orcid.org/0009-0007-6908-0474"},"institutions":[{"id":"https://openalex.org/I4210136249","display_name":"University of Applied Sciences Upper Austria","ror":"https://ror.org/03jqp6d56","country_code":"AT","type":"education","lineage":["https://openalex.org/I4210136249"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Josef Pichler","raw_affiliation_strings":["University of Applied Sciences Upper Austria, Austria"],"affiliations":[{"raw_affiliation_string":"University of Applied Sciences Upper Austria, Austria","institution_ids":["https://openalex.org/I4210136249"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5011251497","display_name":"Herbert Pr\u00e4hofer","orcid":"https://orcid.org/0000-0002-0139-8044"},"institutions":[{"id":"https://openalex.org/I121883995","display_name":"Johannes Kepler University of Linz","ror":"https://ror.org/052r2xn60","country_code":"AT","type":"education","lineage":["https://openalex.org/I121883995"]}],"countries":["AT"],"is_corresponding":false,"raw_author_name":"Herbert Pr\u00e4hofer","raw_affiliation_strings":["Johannes Kepler University Linz, Austria"],"affiliations":[{"raw_affiliation_string":"Johannes Kepler University Linz, Austria","institution_ids":["https://openalex.org/I121883995"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5064162245"],"corresponding_institution_ids":["https://openalex.org/I4210136249"],"apc_list":null,"apc_paid":null,"fwci":2.8599,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.92239719,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"10","issue":"2","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9922000169754028,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9922000169754028,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9617000222206116,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10820","display_name":"Fuzzy Logic and Control Systems","score":0.9544000029563904,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6906216144561768},{"id":"https://openalex.org/keywords/grammar","display_name":"Grammar","score":0.6213892698287964},{"id":"https://openalex.org/keywords/symbolic-execution","display_name":"Symbolic execution","score":0.5785216689109802},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.4654588997364044},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.323638916015625},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.1798233687877655},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.05200359225273132}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6906216144561768},{"id":"https://openalex.org/C26022165","wikidata":"https://www.wikidata.org/wiki/Q8091","display_name":"Grammar","level":2,"score":0.6213892698287964},{"id":"https://openalex.org/C2779639559","wikidata":"https://www.wikidata.org/wiki/Q7661178","display_name":"Symbolic execution","level":3,"score":0.5785216689109802},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.4654588997364044},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.323638916015625},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.1798233687877655},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.05200359225273132},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.22152/programming-journal.org/2025/10/16","is_oa":false,"landing_page_url":"https://doi.org/10.22152/programming-journal.org/2025/10/16","pdf_url":null,"source":{"id":"https://openalex.org/S4210199781","display_name":"The Art Science and Engineering of Programming","issn_l":"2473-7321","issn":["2473-7321"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Art, Science, and Engineering of Programming","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2508.03832","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2508.03832","pdf_url":"https://arxiv.org/pdf/2508.03832","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2508.03832","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2508.03832","pdf_url":"https://arxiv.org/pdf/2508.03832","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2905722102","https://openalex.org/W2155539595","https://openalex.org/W2752815423","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4239107164"],"abstract_inverted_index":{"A":[0],"vast":[1],"number":[2],"of":[3,37,64,94,133,161,208,267,309,323,375,440],"software":[4,65,135,168,407,447],"systems":[5,136],"include":[6],"components":[7,29,43],"that":[8,30,104,179,285,333,365,384],"parse":[9],"and":[10,47,59,257,291,338,360,404,413,438],"process":[11,31],"structured":[12,270,299],"input.":[13],"In":[14,79,124],"addition":[15],"to":[16,71,87,110,247,263,344],"programming":[17],"languages,":[18],"which":[19,74,305],"are":[20,27,188,228,366],"analyzed":[21],"by":[22,166,199,281,369,380],"compilers":[23],"or":[24,33,175],"interpreters,":[25],"there":[26],"numerous":[28,57],"standardized":[32],"proprietary":[34],"data":[35,107,128,141,187],"formats":[36],"varying":[38],"complexity.":[39],"Even":[40],"if":[41],"such":[42,53,351,370],"were":[44],"initially":[45],"developed":[46],"tested":[48],"based":[49],"on":[50,235],"a":[51,55,95,121,171,201,243,288,301,320],"specification,":[52],"as":[54,352],"grammar,":[56],"modifications":[58],"adaptations":[60],"over":[61],"the":[62,89,92,113,131,134,147,152,158,162,167,184,191,205,236,265,274,307,328,334,376,421,427,436,441],"course":[63],"evolution":[66],"can":[67,84,386,449],"make":[68],"it":[69,223,259,355,385],"impossible":[70],"precisely":[72],"determine":[73],"inputs":[75,155,209,278,310],"they":[76,227],"actually":[77],"accept.":[78],"this":[80,118,140,197,240,445],"situation,":[81],"grammar":[82,145,149,160,211,232,237,349,371,417],"mining":[83],"be":[85],"used":[86,143,219],"reconstruct":[88,450],"specification":[90,451],"in":[91,183,363,390,406],"form":[93],"grammar.":[96,193],"Established":[97],"approaches":[98],"already":[99,217],"produce":[100],"useful":[101],"results,":[102],"provided":[103],"sufficient":[105],"input":[106,114,127,163,186,214,248,271,290,296,396,425],"is":[108,120,137,142,279,298,378,400],"available":[109,185],"fully":[111,244],"cover":[112],"language.":[115],"However,":[116],"achieving":[117],"completeness":[119],"major":[122],"challenge.":[123],"practice,":[125],"only":[126,151,430],"recorded":[129],"during":[130],"operation":[132],"available.":[138],"If":[139],"for":[144,204,210,220,231,276,311,340,402,416,423],"mining,":[146],"resulting":[148],"reflects":[150],"actual":[153],"processed":[154],"but":[156,433],"not":[157,429],"complete":[159],"language":[164],"accepted":[165],"component.":[169],"As":[170],"result,":[172],"edge":[173,361],"cases":[174,362],"previously":[176],"supported":[177,379],"features":[178,359],"no":[180],"longer":[181],"appear":[182],"missing":[189],"from":[190,327,347,452],"generated":[192],"This":[194,398],"work":[195,241],"addresses":[196],"challenge":[198],"introducing":[200],"novel":[202,302],"approach":[203,246,251,335,428],"automatic":[206],"generation":[207,297,308],"mining.":[212,418],"Although":[213],"generators":[215],"have":[216],"been":[218],"fuzz":[221],"testing,":[222],"remains":[224],"unclear":[225],"whether":[226],"also":[229,434],"suitable":[230],"miners.":[233,372],"Building":[234],"miner":[238],"Mimid,":[239],"presents":[242],"automated":[245],"generation.":[249],"The":[250,314,373],"leverages":[252],"Dynamic":[253],"Symbolic":[254],"Execution":[255],"(DSE)":[256],"extends":[258,293],"with":[260,287],"two":[261],"mechanisms":[262],"overcome":[264],"limitations":[266],"DSE":[268],"regarding":[269],"parsers.":[272,455],"First,":[273],"search":[275],"new":[277],"guided":[280],"an":[282,410],"iterative":[283],"expansion":[284],"starts":[286],"single-character":[289],"gradually":[292],"it.":[294],"Second,":[295],"into":[300],"three-phase":[303],"approach,":[304,446],"separates":[306],"parser":[312],"functions.":[313],"proposed":[315],"method":[316,377],"was":[317],"evaluated":[318],"against":[319],"diverse":[321],"set":[322],"eleven":[324],"benchmark":[325],"applications":[326],"existing":[329,453],"literature.":[330],"Results":[331],"demonstrate":[332],"achieves":[336],"precision":[337],"recall":[339],"extracted":[341,442],"grammars":[342],"close":[343],"those":[345],"derived":[346],"state-of-the-art":[348],"miners":[350],"Mimid.":[353],"Notably,":[354],"successfully":[356],"uncovers":[357],"subtle":[358],"parsers":[364],"typically":[367],"missed":[368],"effectiveness":[374],"empirical":[381],"evidence,":[382],"showing":[383],"achieve":[387],"high":[388],"performance":[389],"various":[391],"domains":[392],"without":[393],"requiring":[394],"prior":[395],"samples.":[397],"contribution":[399],"significant":[401],"researchers":[403],"practitioners":[405],"engineering,":[408],"offering":[409],"automated,":[411],"scalable,":[412],"precise":[414],"solution":[415],"By":[419],"eliminating":[420],"need":[422],"manual":[424],"generation,":[426],"reduces":[431],"workload":[432],"enhances":[435],"robustness":[437],"comprehensiveness":[439],"grammars.":[443],"Following":[444],"engineers":[448],"(legacy)":[454]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
