{"id":"https://openalex.org/W7140322475","doi":"https://doi.org/10.48550/arxiv.2603.22519","title":"LLMON: An LLM-native Markup Language to Leverage Structure and Semantics at the LLM Interface","display_name":"LLMON: An LLM-native Markup Language to Leverage Structure and Semantics at the LLM Interface","publication_year":2026,"publication_date":"2026-03-23","ids":{"openalex":"https://openalex.org/W7140322475","doi":"https://doi.org/10.48550/arxiv.2603.22519"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.22519","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22519","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.22519","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130561210","display_name":"Michael Hind","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hind, Michael","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019254317","display_name":"Basel Shbita","orcid":"https://orcid.org/0009-0006-3154-3501"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shbita, Basel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130608839","display_name":"Bo Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Bo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130613536","display_name":"Farhan Ahmed","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ahmed, Farhan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051321506","display_name":"Chad DeLuca","orcid":"https://orcid.org/0009-0009-7690-7454"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"DeLuca, Chad","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069329835","display_name":"Nathan Fulton","orcid":"https://orcid.org/0000-0002-4172-7631"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fulton, Nathan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130586866","display_name":"David J. Cox","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cox, David","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130615276","display_name":"Dan Gutfreund","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gutfreund, Dan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.19130000472068787,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.19130000472068787,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.14470000565052032,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.06469999998807907,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/markup-language","display_name":"Markup language","score":0.7865999937057495},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.49390000104904175},{"id":"https://openalex.org/keywords/ruleml","display_name":"RuleML","score":0.4749000072479248},{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.41659998893737793},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.40880000591278076},{"id":"https://openalex.org/keywords/xml","display_name":"XML","score":0.3910999894142151},{"id":"https://openalex.org/keywords/interface","display_name":"Interface (matter)","score":0.38199999928474426},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.336899995803833},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.33480000495910645}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8450000286102295},{"id":"https://openalex.org/C45874996","wikidata":"https://www.wikidata.org/wiki/Q37045","display_name":"Markup language","level":3,"score":0.7865999937057495},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.5943999886512756},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.49390000104904175},{"id":"https://openalex.org/C196388810","wikidata":"https://www.wikidata.org/wiki/Q631877","display_name":"RuleML","level":5,"score":0.4749000072479248},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.41659998893737793},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.40880000591278076},{"id":"https://openalex.org/C8797682","wikidata":"https://www.wikidata.org/wiki/Q2115","display_name":"XML","level":2,"score":0.3910999894142151},{"id":"https://openalex.org/C113843644","wikidata":"https://www.wikidata.org/wiki/Q901882","display_name":"Interface (matter)","level":4,"score":0.38199999928474426},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3418999910354614},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.336899995803833},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.33480000495910645},{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.32420000433921814},{"id":"https://openalex.org/C189139006","wikidata":"https://www.wikidata.org/wiki/Q166074","display_name":"XHTML","level":4,"score":0.32089999318122864},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3188999891281128},{"id":"https://openalex.org/C2779010991","wikidata":"https://www.wikidata.org/wiki/Q2720909","display_name":"Artifact (error)","level":2,"score":0.31679999828338623},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.311599999666214},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.303600013256073},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2827000021934509},{"id":"https://openalex.org/C89505385","wikidata":"https://www.wikidata.org/wiki/Q47146","display_name":"User interface","level":2,"score":0.2793999910354614},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.27469998598098755},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.274399995803833},{"id":"https://openalex.org/C33762810","wikidata":"https://www.wikidata.org/wiki/Q461671","display_name":"Data integrity","level":2,"score":0.2736999988555908},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.2612999975681305},{"id":"https://openalex.org/C20894473","wikidata":"https://www.wikidata.org/wiki/Q1116105","display_name":"Object model","level":3,"score":0.2603999972343445},{"id":"https://openalex.org/C509989072","wikidata":"https://www.wikidata.org/wiki/Q15188241","display_name":"Model-driven architecture","level":4,"score":0.2540999948978424},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.2529999911785126}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.22519","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22519","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.22519","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.22519","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Textual":[0],"Large":[1],"Language":[2],"Models":[3],"(LLMs)":[4],"provide":[5,213],"a":[6,11,31,41,54,118,202],"simple":[7],"and":[8,20,34,56,79,108,135,145,169,188,209,212,232],"familiar":[9],"interface:":[10],"string":[12],"of":[13,111,178,218,223],"text":[14,113],"is":[15,37,148],"used":[16,129,157],"for":[17,158,221],"both":[18,48,222],"input":[19],"output.":[21],"However,":[22],"the":[23,71,106,112,174,184,198],"information":[24,125,199],"conveyed":[25,39],"to":[26,60,70,76,114,121,139,150],"an":[27,94,122,179,239],"LLM":[28],"often":[29],"has":[30],"richer":[32],"structure":[33,107],"semantics,":[35],"which":[36],"not":[38,66],"in":[40,117,141,201],"string.":[42],"For":[43],"example,":[44],"most":[45],"prompts":[46],"contain":[47],"instructions":[49],"(\"Summarize":[50],"this":[51,90],"paper":[52,59],"into":[53],"paragraph\")":[55],"data":[57],"(the":[58],"summarize),":[61],"but":[62],"these":[63,193,224],"are":[64,236],"usually":[65],"distinguished":[67],"when":[68],"passed":[69],"model.":[72],"This":[73,87,124,147],"can":[74,126,155,205],"lead":[75],"model":[77,131,133,142,207],"confusion":[78],"security":[80],"risks,":[81],"such":[82,161],"as":[83,162],"prompt":[84],"injection":[85],"attacks.":[86],"work":[88],"addresses":[89],"shortcoming":[91],"by":[92],"introducing":[93],"LLM-native":[95,180,240],"mark-up":[96],"language,":[97,182],"LLMON":[98,185,203],"(LLM":[99],"Object":[100],"Notation,":[101],"pronounced":[102],"\"Lemon\"),":[103],"that":[104,235],"enables":[105],"semantic":[109],"metadata":[110],"be":[115,128,156],"communicated":[116],"natural":[119],"way":[120],"LLM.":[123],"then":[127],"during":[130],"training,":[132],"prompting,":[134],"inference":[136,210],"implementation,":[137,211],"leading":[138],"improvements":[140],"accuracy,":[143],"safety,":[144],"security.":[146],"analogous":[149],"how":[151,190,197],"programming":[152],"language":[153,187],"types":[154],"many":[159],"purposes,":[160],"static":[163],"checking,":[164,168],"code":[165],"generation,":[166],"dynamic":[167],"IDE":[170],"highlighting.":[171],"We":[172,227],"discuss":[173,229],"general":[175],"design":[176,194],"requirements":[177],"markup":[181,186],"introduce":[183],"show":[189],"it":[191],"meets":[192],"requirements,":[195],"describe":[196],"contained":[200],"artifact":[204],"benefit":[206],"training":[208],"some":[214],"preliminary":[215],"empirical":[216],"evidence":[217],"its":[219],"value":[220],"use":[225],"cases.":[226],"also":[228],"broader":[230],"issues":[231],"research":[233],"opportunities":[234],"enabled":[237],"with":[238],"approach.":[241]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-26T00:00:00"}
