{"id":"https://openalex.org/W4416709217","doi":"https://doi.org/10.48550/arxiv.2509.02227","title":"Application Of Large Language Models For The Extraction Of Information From Particle Accelerator Technical Documentation","display_name":"Application Of Large Language Models For The Extraction Of Information From Particle Accelerator Technical Documentation","publication_year":2025,"publication_date":"2025-09-02","ids":{"openalex":"https://openalex.org/W4416709217","doi":"https://doi.org/10.48550/arxiv.2509.02227"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2509.02227","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.02227","pdf_url":"https://arxiv.org/pdf/2509.02227","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2509.02227","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5012805315","display_name":"Qing Dai","orcid":"https://orcid.org/0000-0002-8578-1568"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Dai, Qing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120476549","display_name":"Rasmus Ischebeck","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ischebeck, Rasmus","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064532130","display_name":"M. Sapinski","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sapinski, Maruisz","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5044853035","display_name":"Adam Grycner","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Grycner, Adam","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5012805315"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.07460000365972519,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.07460000365972519,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T13650","display_name":"Computational Physics and Python Applications","score":0.07000000029802322,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13726","display_name":"International Science and Diplomacy","score":0.06400000303983688,"subfield":{"id":"https://openalex.org/subfields/3320","display_name":"Political Science and International Relations"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.7854999899864197},{"id":"https://openalex.org/keywords/documentation","display_name":"Documentation","score":0.7796000242233276},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5609999895095825},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.46549999713897705},{"id":"https://openalex.org/keywords/work","display_name":"Work (physics)","score":0.4099999964237213},{"id":"https://openalex.org/keywords/domain-specific-language","display_name":"Domain-specific language","score":0.3573000133037567}],"concepts":[{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.7854999899864197},{"id":"https://openalex.org/C56666940","wikidata":"https://www.wikidata.org/wiki/Q788790","display_name":"Documentation","level":2,"score":0.7796000242233276},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6618000268936157},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5609999895095825},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.46549999713897705},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.4099999964237213},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.3921000063419342},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3765999972820282},{"id":"https://openalex.org/C135257023","wikidata":"https://www.wikidata.org/wiki/Q691358","display_name":"Domain-specific language","level":2,"score":0.3573000133037567},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.35420000553131104},{"id":"https://openalex.org/C32896092","wikidata":"https://www.wikidata.org/wiki/Q189447","display_name":"Risk management","level":2,"score":0.2842000126838684},{"id":"https://openalex.org/C52421305","wikidata":"https://www.wikidata.org/wiki/Q1151499","display_name":"Particle filter","level":3,"score":0.2761000096797943},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2745000123977661},{"id":"https://openalex.org/C25688753","wikidata":"https://www.wikidata.org/wiki/Q1413406","display_name":"Technical documentation","level":3,"score":0.2727999985218048},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.26159998774528503},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.257999986410141},{"id":"https://openalex.org/C545109879","wikidata":"https://www.wikidata.org/wiki/Q5157412","display_name":"Computer Applications","level":2,"score":0.25099998712539673}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2509.02227","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.02227","pdf_url":"https://arxiv.org/pdf/2509.02227","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2509.02227","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2509.02227","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2509.02227","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.02227","pdf_url":"https://arxiv.org/pdf/2509.02227","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"large":[1,36],"set":[2],"of":[3,6,14,35,46,62,68,79,91,103,115,123,137],"technical":[4,51],"documentation":[5],"legacy":[7,73],"accelerator":[8,50],"systems,":[9],"coupled":[10],"with":[11],"the":[12,18,33,44,60,66,89,101,113,135],"retirement":[13],"experienced":[15],"personnel,":[16],"underscores":[17],"urgent":[19],"need":[20],"for":[21,130],"efficient":[22],"methods":[23],"to":[24,40,58,82,139],"preserve":[25],"and":[26,42,96,121,127,148],"transfer":[27],"specialized":[28,84,153],"knowledge.":[29],"This":[30,132],"paper":[31],"explores":[32],"application":[34],"language":[37],"models":[38],"(LLMs),":[39],"automate":[41],"enhance":[43],"extraction":[45],"information":[47],"from":[48],"particle":[49],"documents.":[52],"By":[53],"exploiting":[54],"LLMs,":[55,117],"we":[56,111],"aim":[57],"address":[59],"challenges":[61],"knowledge":[63,147],"retention,":[64],"enabling":[65],"retrieval":[67],"domain":[69],"expertise":[70],"embedded":[71],"in":[72,93,144,151],"documentation.":[74],"We":[75],"present":[76],"initial":[77],"results":[78],"adapting":[80],"LLMs":[81,92,138],"this":[83],"domain.":[85],"Our":[86],"evaluation":[87],"demonstrates":[88],"effectiveness":[90],"extracting,":[94],"summarizing,":[95],"organizing":[97],"knowledge,":[98],"significantly":[99],"reducing":[100],"risk":[102],"losing":[104],"valuable":[105],"insights":[106],"as":[107,119],"personnel":[108],"retire.":[109],"Furthermore,":[110],"discuss":[112],"limitations":[114],"current":[116],"such":[118],"interpretability":[120],"handling":[122],"rare":[124],"domain-specific":[125],"terms,":[126],"propose":[128],"strategies":[129],"improvement.":[131],"work":[133],"highlights":[134],"potential":[136],"play":[140],"a":[141],"pivotal":[142],"role":[143],"preserving":[145],"institutional":[146],"ensuring":[149],"continuity":[150],"highly":[152],"fields.":[154]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
