{"id":"https://openalex.org/W7152504608","doi":"https://doi.org/10.48550/arxiv.2604.06559","title":"ExplainFuzz: Explainable and Constraint-Conditioned Test Generation with Probabilistic Circuits","display_name":"ExplainFuzz: Explainable and Constraint-Conditioned Test Generation with Probabilistic Circuits","publication_year":2026,"publication_date":"2026-04-08","ids":{"openalex":"https://openalex.org/W7152504608","doi":"https://doi.org/10.48550/arxiv.2604.06559"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.06559","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.06559","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.06559","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133295330","display_name":"Anna\u00eblle Baiget","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Baiget, Anna\u00eblle","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089855486","display_name":"Jaron Maene","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Maene, Jaron","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133251368","display_name":"Seongmin Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Seongmin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133262515","display_name":"Benjie Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Benjie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133242648","display_name":"Guy Van den Broeck","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Broeck, Guy Van den","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5049451101","display_name":"Miryung Kim","orcid":"https://orcid.org/0000-0003-3802-1512"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Miryung","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5133295330"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.6754000186920166,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.6754000186920166,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.0421999990940094,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.03220000118017197,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.7734000086784363},{"id":"https://openalex.org/keywords/perplexity","display_name":"Perplexity","score":0.5098000168800354},{"id":"https://openalex.org/keywords/grammar","display_name":"Grammar","score":0.420199990272522},{"id":"https://openalex.org/keywords/coherence","display_name":"Coherence (philosophical gambling strategy)","score":0.4081000089645386},{"id":"https://openalex.org/keywords/probabilistic-relevance-model","display_name":"Probabilistic relevance model","score":0.39890000224113464},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.33500000834465027},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.3292999863624573}],"concepts":[{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.7734000086784363},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7682999968528748},{"id":"https://openalex.org/C100279451","wikidata":"https://www.wikidata.org/wiki/Q372193","display_name":"Perplexity","level":3,"score":0.5098000168800354},{"id":"https://openalex.org/C26022165","wikidata":"https://www.wikidata.org/wiki/Q8091","display_name":"Grammar","level":2,"score":0.420199990272522},{"id":"https://openalex.org/C2781181686","wikidata":"https://www.wikidata.org/wiki/Q4226068","display_name":"Coherence (philosophical gambling strategy)","level":2,"score":0.4081000089645386},{"id":"https://openalex.org/C143017306","wikidata":"https://www.wikidata.org/wiki/Q3318133","display_name":"Probabilistic relevance model","level":4,"score":0.39890000224113464},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3513999879360199},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3483999967575073},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.33500000834465027},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.3292999863624573},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.3248000144958496},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.31200000643730164},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2955999970436096},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.2924000024795532},{"id":"https://openalex.org/C510870499","wikidata":"https://www.wikidata.org/wiki/Q47607","display_name":"SQL","level":2,"score":0.2824999988079071},{"id":"https://openalex.org/C52740198","wikidata":"https://www.wikidata.org/wiki/Q1539564","display_name":"Importance sampling","level":3,"score":0.2761000096797943},{"id":"https://openalex.org/C58166","wikidata":"https://www.wikidata.org/wiki/Q224821","display_name":"Fuzzy logic","level":2,"score":0.274399995803833},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.2685999870300293},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.25459998846054077}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.06559","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.06559","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.06559","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.06559","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.6405107378959656,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Understanding":[0],"and":[1,15,25,51,68,77,90,130,141,155,190],"explaining":[2],"the":[3,105,139,166,200,216,225],"structure":[4],"of":[5,108,143,168,202,219,227],"generated":[6,100,144],"test":[7,58,74,237],"inputs":[8,37,75,97,127,169],"is":[9,211],"essential":[10],"for":[11,234],"effective":[12],"software":[13],"testing":[14],"debugging.":[16],"Existing":[17],"approaches--including":[18],"grammar-based":[19,73],"fuzzers,":[20],"probabilistic":[21,49,123,242],"Context-Free":[22,82],"Grammars":[23],"(pCFGs),":[24],"Large":[26],"Language":[27],"Models":[28],"(LLMs)--suffer":[29],"from":[30,80,184,191],"critical":[31],"limitations.":[32],"They":[33],"frequently":[34],"produce":[35],"ill-formed":[36],"that":[38,61,136,170,239],"fail":[39],"to":[40,46,66,110,125,151,176,186,193,214,229],"reflect":[41],"realistic":[42],"data":[43],"distributions,":[44],"struggle":[45],"capture":[47],"context-sensitive":[48],"dependencies,":[50],"lack":[52],"explainability.":[53],"We":[54],"introduce":[55],"ExplainFuzz,":[56],"a":[57,81,87,115,172,203,232],"generation":[59,238],"framework":[60],"leverages":[62],"Probabilistic":[63],"Circuits":[64],"(PCs)":[65],"learn":[67],"query":[69,116],"structured":[70],"distributions":[71],"over":[72,207],"interpretably":[76],"controllably.":[78],"Starting":[79],"Grammar":[83],"(CFG),":[84],"ExplainFuzz":[85,103,137,163,180],"compiles":[86],"grammar-aware":[88,177],"PC":[89],"trains":[91],"it":[92],"on":[93],"existing":[94],"inputs.":[95,221],"New":[96],"are":[98],"then":[99],"via":[101],"sampling.":[102],"utilizes":[104],"conditioning":[106,161],"capability":[107],"PCs":[109,228],"incorporate":[111],"test-specific":[112],"constraints":[113],"(e.g.,":[114],"must":[117],"have":[118],"GROUP":[119],"BY),":[120],"enabling":[121],"constrained":[122],"sampling":[124],"generate":[126],"satisfying":[128],"grammar":[129],"user-provided":[131,173],"constraints.":[132],"Our":[133],"results":[134,198],"show":[135],"improves":[138],"coherence":[140],"realism":[142],"inputs,":[145],"achieving":[146],"significant":[147],"perplexity":[148],"reduction":[149],"compared":[150],"pCFGs,":[152],"grammar-unaware":[153],"PCs,":[154],"LLMs.":[156],"By":[157],"leveraging":[158],"its":[159],"native":[160],"capability,":[162],"significantly":[164],"enhances":[165],"diversity":[167],"satisfy":[171],"constraint.":[174],"Compared":[175],"mutational":[178,208],"fuzzing,":[179,209],"increases":[181],"bug-triggering":[182],"rates":[183],"35%":[185],"63%":[187],"in":[188,195],"SQL":[189],"10%":[192],"100%":[194],"XML.":[196],"These":[197,222],"demonstrate":[199],"power":[201],"learned":[204],"input":[205],"distribution":[206],"which":[210],"often":[212],"limited":[213],"exploring":[215],"local":[217],"neighborhood":[218],"seed":[220],"capabilities":[223],"highlight":[224],"potential":[226],"serve":[230],"as":[231],"foundation":[233],"grammar-aware,":[235],"controllable":[236],"captures":[240],"context-sensitive,":[241],"dependencies.":[243]},"counts_by_year":[],"updated_date":"2026-04-10T06:07:51.998497","created_date":"2026-04-10T00:00:00"}
