{"id":"https://openalex.org/W7151362333","doi":"https://doi.org/10.48550/arxiv.2604.03380","title":"Noise Steering for Controlled Text Generation: Improving Diversity and Reading-Level Fidelity in Arabic Educational Story Generation","display_name":"Noise Steering for Controlled Text Generation: Improving Diversity and Reading-Level Fidelity in Arabic Educational Story Generation","publication_year":2026,"publication_date":"2026-04-03","ids":{"openalex":"https://openalex.org/W7151362333","doi":"https://doi.org/10.48550/arxiv.2604.03380"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.03380","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03380","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.03380","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5120308298","display_name":"Haziq Mohammad Khalid","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Khalid, Haziq Mohammad","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002365604","display_name":"Salsabeel Shapsough","orcid":"https://orcid.org/0000-0002-8667-4799"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shapsough, Salsabeel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5035716630","display_name":"Imran Zualkernan","orcid":"https://orcid.org/0000-0002-1048-5633"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zualkernan, Imran","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5120308298"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10103","display_name":"Reading and Literacy Development","score":0.38510000705718994,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10103","display_name":"Reading and Literacy Development","score":0.38510000705718994,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.3118000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.061799999326467514,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/fidelity","display_name":"Fidelity","score":0.6434000134468079},{"id":"https://openalex.org/keywords/narrative","display_name":"Narrative","score":0.5501000285148621},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4426000118255615},{"id":"https://openalex.org/keywords/reading","display_name":"Reading (process)","score":0.41909998655319214},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.40139999985694885},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.39089998602867126},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.3727000057697296},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.364300012588501}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.663100004196167},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.6434000134468079},{"id":"https://openalex.org/C199033989","wikidata":"https://www.wikidata.org/wiki/Q1318295","display_name":"Narrative","level":2,"score":0.5501000285148621},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4426000118255615},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43790000677108765},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.41929998993873596},{"id":"https://openalex.org/C554936623","wikidata":"https://www.wikidata.org/wiki/Q199657","display_name":"Reading (process)","level":2,"score":0.41909998655319214},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.40139999985694885},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.39089998602867126},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3727000057697296},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.364300012588501},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.36250001192092896},{"id":"https://openalex.org/C60069766","wikidata":"https://www.wikidata.org/wiki/Q357054","display_name":"Antenna diversity","level":3,"score":0.36239999532699585},{"id":"https://openalex.org/C2781316041","wikidata":"https://www.wikidata.org/wiki/Q1230584","display_name":"Diversity (politics)","level":2,"score":0.36160001158714294},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.35350000858306885},{"id":"https://openalex.org/C113364801","wikidata":"https://www.wikidata.org/wiki/Q26674","display_name":"High fidelity","level":2,"score":0.34790000319480896},{"id":"https://openalex.org/C2777413886","wikidata":"https://www.wikidata.org/wiki/Q3276013","display_name":"Fluency","level":2,"score":0.34380000829696655},{"id":"https://openalex.org/C4199805","wikidata":"https://www.wikidata.org/wiki/Q2725903","display_name":"Gaussian noise","level":2,"score":0.321399986743927},{"id":"https://openalex.org/C129844170","wikidata":"https://www.wikidata.org/wiki/Q41299","display_name":"Quadratic equation","level":2,"score":0.28760001063346863},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.27559998631477356},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.2653999924659729},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.26260000467300415},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.257099986076355},{"id":"https://openalex.org/C96455323","wikidata":"https://www.wikidata.org/wiki/Q13955","display_name":"Arabic","level":2,"score":0.2547000050544739}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.03380","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03380","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.03380","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.03380","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.8937031626701355}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Generating":[0],"diverse,":[1],"pedagogically":[2],"valid":[3],"stories":[4],"for":[5,146],"Arabic":[6],"early-grade":[7,97],"reading":[8,16,79,98,121],"assessments":[9],"requires":[10],"balancing":[11],"tight":[12],"constraints":[13],"on":[14,128],"vocabulary,":[15],"level,":[17],"and":[18,78,95,124],"narrative":[19,87],"structure":[20],"against":[21,69],"the":[22,41,110],"need":[23],"to":[24,136],"avoid":[25],"repetitive":[26],"plots":[27],"that":[28],"undermine":[29],"assessment":[30],"validity.":[31],"We":[32,64,131],"investigate":[33],"noise":[34,84,106,114],"steering,":[35],"injecting":[36],"calibrated":[37],"Gaussian":[38],"perturbations":[39],"into":[40],"internal":[42,133],"representations":[43],"of":[44],"transformer":[45],"models":[46,61],"at":[47],"inference":[48],"time,":[49],"as":[50],"a":[51,138],"training-free":[52],"diversity":[53,88,141],"method":[54],"evaluated":[55],"across":[56,100],"five":[57],"small":[58],"Arabic-centric":[59,102],"language":[60],"(7-9B":[62],"parameters).":[63],"compare":[65],"four":[66],"injection":[67,107],"strategies":[68],"high-temperature":[70],"sampling":[71,119],"baselines,":[72],"measuring":[73],"diversity,":[74],"quality,":[75],"constraint":[76,93],"adherence,":[77],"grade":[80,122],"level.":[81],"Residual":[82],"stream":[83],"consistently":[85],"improves":[86],"with":[89],"minimal":[90],"quality":[91],"or":[92],"cost":[94],"preserves":[96],"level":[99,123],"all":[101],"models.":[103,130],"Attention":[104],"entropy":[105],"(AENI)":[108],"stabilizes":[109],"otherwise":[111],"unreliable":[112],"attention-logit":[113],"while":[115],"recovering":[116],"quality.":[117],"High-temperature":[118],"inflates":[120],"causes":[125],"catastrophic":[126],"collapse":[127],"several":[129],"find":[132],"representation-level":[134],"perturbation":[135],"be":[137],"more":[139],"suitable":[140],"strategy":[142],"than":[143],"output-level":[144],"stochasticity":[145],"constrained":[147],"educational":[148],"content":[149],"generation.":[150]},"counts_by_year":[],"updated_date":"2026-05-06T06:03:25.996018","created_date":"2026-04-08T00:00:00"}
