{"id":"https://openalex.org/W7160988150","doi":"https://doi.org/10.48550/arxiv.2605.11769","title":"Safety-Oriented Evaluation of Language Understanding Systems for Air Traffic Control","display_name":"Safety-Oriented Evaluation of Language Understanding Systems for Air Traffic Control","publication_year":2026,"publication_date":"2026-05-12","ids":{"openalex":"https://openalex.org/W7160988150","doi":"https://doi.org/10.48550/arxiv.2605.11769"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.11769","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.11769","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.11769","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136009058","display_name":"Yujing Chang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chang, Yujing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136062257","display_name":"Yash Guleria","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guleria, Yash","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091693318","display_name":"Duc-Thinh Pham","orcid":"https://orcid.org/0000-0001-5156-8171"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pham, Duc-Thinh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136012496","display_name":"Nhut-Huy Pham","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pham, Nhut-Huy","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136002649","display_name":"Ningli Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Ningli","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123958685","display_name":"Vu N. Duong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Duong, Vu N.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136027004","display_name":"Sameer Alam","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alam, Sameer","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11489","display_name":"Air Traffic Management and Optimization","score":0.271699994802475,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11489","display_name":"Air Traffic Management and Optimization","score":0.271699994802475,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.2371000051498413,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.12960000336170197,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/air-traffic-control","display_name":"Air traffic control","score":0.7210000157356262},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.6478000283241272},{"id":"https://openalex.org/keywords/runway","display_name":"Runway","score":0.5353000164031982},{"id":"https://openalex.org/keywords/aggregate","display_name":"Aggregate (composite)","score":0.5019999742507935},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.47440001368522644},{"id":"https://openalex.org/keywords/air-traffic-management","display_name":"Air traffic management","score":0.46160000562667847},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.45879998803138733}],"concepts":[{"id":"https://openalex.org/C166961238","wikidata":"https://www.wikidata.org/wiki/Q221395","display_name":"Air traffic control","level":2,"score":0.7210000157356262},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.6478000283241272},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6100000143051147},{"id":"https://openalex.org/C81155309","wikidata":"https://www.wikidata.org/wiki/Q184590","display_name":"Runway","level":2,"score":0.5353000164031982},{"id":"https://openalex.org/C4679612","wikidata":"https://www.wikidata.org/wiki/Q866298","display_name":"Aggregate (composite)","level":2,"score":0.5019999742507935},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.47440001368522644},{"id":"https://openalex.org/C2776777543","wikidata":"https://www.wikidata.org/wiki/Q1361182","display_name":"Air traffic management","level":3,"score":0.46160000562667847},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.45879998803138733},{"id":"https://openalex.org/C154504017","wikidata":"https://www.wikidata.org/wiki/Q853614","display_name":"Identifier","level":2,"score":0.4408000111579895},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.41909998655319214},{"id":"https://openalex.org/C200601418","wikidata":"https://www.wikidata.org/wiki/Q2193887","display_name":"Reliability engineering","level":1,"score":0.32910001277923584},{"id":"https://openalex.org/C166955791","wikidata":"https://www.wikidata.org/wiki/Q629579","display_name":"Macro","level":2,"score":0.3181999921798706},{"id":"https://openalex.org/C506615639","wikidata":"https://www.wikidata.org/wiki/Q21662260","display_name":"Command and control","level":2,"score":0.3142000138759613},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.30720001459121704},{"id":"https://openalex.org/C3017944768","wikidata":"https://www.wikidata.org/wiki/Q1450463","display_name":"Poison control","level":2,"score":0.28929999470710754},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.25940001010894775},{"id":"https://openalex.org/C527412718","wikidata":"https://www.wikidata.org/wiki/Q855395","display_name":"Interpretation (philosophy)","level":2,"score":0.2529999911785126}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.11769","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.11769","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.11769","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.11769","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Air":[0],"Traffic":[1],"Control":[2],"(ATC)":[3],"is":[4,103],"a":[5,80],"safety-critical":[6],"domain":[7],"in":[8,31,133],"which":[9],"incorrect":[10,68],"interpretation":[11],"of":[12,63,150,158],"instructions":[13],"may":[14],"lead":[15],"to":[16,57,86],"severe":[17],"operational":[18,32,101],"consequences.":[19],"While":[20],"large":[21],"language":[22],"models":[23,119],"(LLMs)":[24],"demonstrate":[25],"strong":[26],"general":[27],"performance,":[28],"their":[29,100],"reliability":[30,102],"ATC":[33,87,160],"environments":[34],"remains":[35],"unclear.":[36],"Existing":[37],"evaluation":[38,83,152],"approaches,":[39],"largely":[40],"based":[41],"on":[42,107],"aggregate":[43,98],"metrics":[44],"such":[45],"as":[46],"F1":[47],"or":[48,71],"macro":[49],"accuracy,":[50,99],"treat":[51],"all":[52],"errors":[53,131],"uniformly":[54],"and":[55],"fail":[56],"account":[58],"for":[59,154],"the":[60,110,148,155],"asymmetric":[61],"consequences":[62],"high-risk":[64],"semantic":[65],"mistakes":[66],"(e.g.,":[67],"runway":[69],"identifiers":[70],"movement":[72],"constraints).":[73],"To":[74],"address":[75],"this":[76],"gap,":[77],"we":[78],"propose":[79],"safety-oriented,":[81],"consequence-aware":[82,151],"framework":[84],"tailored":[85],"operations.":[88],"Our":[89],"results":[90],"reveal":[91],"that":[92,130],"while":[93],"current":[94],"LLMs":[95],"achieve":[96],"reasonable":[97],"severely":[104],"limited.":[105],"Evaluated":[106],"clean":[108],"transcripts,":[109],"peak":[111],"Risk":[112],"Score":[113],"reaches":[114],"only":[115],"0.69,":[116],"with":[117],"most":[118],"scoring":[120],"below":[121],"0.6":[122],"despite":[123,136],"high":[124],"macro-F1":[125],"performance.":[126],"Further":[127],"analysis":[128],"shows":[129],"concentrate":[132],"high-impact":[134],"entities":[135],"relatively":[137],"stable":[138],"action-type":[139],"classification,":[140],"indicating":[141],"structural":[142],"grounding":[143],"deficiencies.":[144],"These":[145],"findings":[146],"highlight":[147],"necessity":[149],"protocols":[153],"responsible":[156],"deployment":[157],"AI-assisted":[159],"systems.":[161]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-14T00:00:00"}
