{"id":"https://openalex.org/W4412673519","doi":"https://doi.org/10.1145/3731120.3744624","title":"A Substring Extraction-Based RAG Method for Minimising Hallucinations in Aircraft Maintenance Question Answering","display_name":"A Substring Extraction-Based RAG Method for Minimising Hallucinations in Aircraft Maintenance Question Answering","publication_year":2025,"publication_date":"2025-07-18","ids":{"openalex":"https://openalex.org/W4412673519","doi":"https://doi.org/10.1145/3731120.3744624"},"language":"en","primary_location":{"id":"doi:10.1145/3731120.3744624","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3731120.3744624","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 International ACM SIGIR Conference on Innovative Concepts and Theories in Information Retrieval (ICTIR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5119079165","display_name":"Quentin Sign\u00e9","orcid":null},"institutions":[{"id":"https://openalex.org/I112991645","display_name":"Airbus (France)","ror":"https://ror.org/023qdcg29","country_code":"FR","type":"company","lineage":["https://openalex.org/I112991645","https://openalex.org/I4210121748"]},{"id":"https://openalex.org/I134560555","display_name":"Universit\u00e9 Toulouse III - Paul Sabatier","ror":"https://ror.org/02v6kpv12","country_code":"FR","type":"education","lineage":["https://openalex.org/I134560555"]},{"id":"https://openalex.org/I3131550300","display_name":"Universit\u00e9 Toulouse-I-Capitole","ror":"https://ror.org/0443n9e75","country_code":"FR","type":"education","lineage":["https://openalex.org/I3131550300"]},{"id":"https://openalex.org/I4210119061","display_name":"Institut de Recherche en Informatique de Toulouse","ror":"https://ror.org/01rx4qw44","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I205747304","https://openalex.org/I205747304","https://openalex.org/I4210119061","https://openalex.org/I4387153255","https://openalex.org/I4405258862","https://openalex.org/I4405258862"]},{"id":"https://openalex.org/I4210152422","display_name":"Universit\u00e9 Toulouse - Jean Jaur\u00e8s","ror":"https://ror.org/04ezk3x31","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210152422","https://openalex.org/I4405258862"]},{"id":"https://openalex.org/I4210160189","display_name":"Institut Polytechnique de Bordeaux","ror":"https://ror.org/054qv7y42","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210160189"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Quentin Sign\u00e9","raw_affiliation_strings":["Universit\u00e9 de Toulouse - IRIT UMR 5505, Toulouse, France and Airbus Protect, Blagnac, France"],"affiliations":[{"raw_affiliation_string":"Universit\u00e9 de Toulouse - IRIT UMR 5505, Toulouse, France and Airbus Protect, Blagnac, France","institution_ids":["https://openalex.org/I4210152422","https://openalex.org/I134560555","https://openalex.org/I4210119061","https://openalex.org/I3131550300","https://openalex.org/I4210160189","https://openalex.org/I112991645"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052301458","display_name":"Mohand Boughanem","orcid":"https://orcid.org/0000-0001-7004-0807"},"institutions":[{"id":"https://openalex.org/I134560555","display_name":"Universit\u00e9 Toulouse III - Paul Sabatier","ror":"https://ror.org/02v6kpv12","country_code":"FR","type":"education","lineage":["https://openalex.org/I134560555"]},{"id":"https://openalex.org/I3131550300","display_name":"Universit\u00e9 Toulouse-I-Capitole","ror":"https://ror.org/0443n9e75","country_code":"FR","type":"education","lineage":["https://openalex.org/I3131550300"]},{"id":"https://openalex.org/I4210119061","display_name":"Institut de Recherche en Informatique de Toulouse","ror":"https://ror.org/01rx4qw44","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I205747304","https://openalex.org/I205747304","https://openalex.org/I4210119061","https://openalex.org/I4387153255","https://openalex.org/I4405258862","https://openalex.org/I4405258862"]},{"id":"https://openalex.org/I4210152422","display_name":"Universit\u00e9 Toulouse - Jean Jaur\u00e8s","ror":"https://ror.org/04ezk3x31","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210152422","https://openalex.org/I4405258862"]},{"id":"https://openalex.org/I4210160189","display_name":"Institut Polytechnique de Bordeaux","ror":"https://ror.org/054qv7y42","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210160189"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Mohand Boughanem","raw_affiliation_strings":["Universit\u00e9 de Toulouse - IRIT UMR 5505, Toulouse, France"],"affiliations":[{"raw_affiliation_string":"Universit\u00e9 de Toulouse - IRIT UMR 5505, Toulouse, France","institution_ids":["https://openalex.org/I4210152422","https://openalex.org/I134560555","https://openalex.org/I4210119061","https://openalex.org/I3131550300","https://openalex.org/I4210160189"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027337246","display_name":"Jos\u00e9 G. Moreno","orcid":"https://orcid.org/0000-0002-8852-5797"},"institutions":[{"id":"https://openalex.org/I134560555","display_name":"Universit\u00e9 Toulouse III - Paul Sabatier","ror":"https://ror.org/02v6kpv12","country_code":"FR","type":"education","lineage":["https://openalex.org/I134560555"]},{"id":"https://openalex.org/I3131550300","display_name":"Universit\u00e9 Toulouse-I-Capitole","ror":"https://ror.org/0443n9e75","country_code":"FR","type":"education","lineage":["https://openalex.org/I3131550300"]},{"id":"https://openalex.org/I4210119061","display_name":"Institut de Recherche en Informatique de Toulouse","ror":"https://ror.org/01rx4qw44","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I205747304","https://openalex.org/I205747304","https://openalex.org/I4210119061","https://openalex.org/I4387153255","https://openalex.org/I4405258862","https://openalex.org/I4405258862"]},{"id":"https://openalex.org/I4210152422","display_name":"Universit\u00e9 Toulouse - Jean Jaur\u00e8s","ror":"https://ror.org/04ezk3x31","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210152422","https://openalex.org/I4405258862"]},{"id":"https://openalex.org/I4210160189","display_name":"Institut Polytechnique de Bordeaux","ror":"https://ror.org/054qv7y42","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210160189"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Jose G. Moreno","raw_affiliation_strings":["Universit\u00e9 de Toulouse - IRIT UMR 5505, Toulouse, France"],"affiliations":[{"raw_affiliation_string":"Universit\u00e9 de Toulouse - IRIT UMR 5505, Toulouse, France","institution_ids":["https://openalex.org/I4210152422","https://openalex.org/I134560555","https://openalex.org/I4210119061","https://openalex.org/I3131550300","https://openalex.org/I4210160189"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077888210","display_name":"Thiziri Belkacem","orcid":"https://orcid.org/0000-0001-9454-0996"},"institutions":[{"id":"https://openalex.org/I112991645","display_name":"Airbus (France)","ror":"https://ror.org/023qdcg29","country_code":"FR","type":"company","lineage":["https://openalex.org/I112991645","https://openalex.org/I4210121748"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Thiziri Belkacem","raw_affiliation_strings":["Airbus Protect, Blagnac, France"],"affiliations":[{"raw_affiliation_string":"Airbus Protect, Blagnac, France","institution_ids":["https://openalex.org/I112991645"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5119079165"],"corresponding_institution_ids":["https://openalex.org/I112991645","https://openalex.org/I134560555","https://openalex.org/I3131550300","https://openalex.org/I4210119061","https://openalex.org/I4210152422","https://openalex.org/I4210160189"],"apc_list":null,"apc_paid":null,"fwci":7.0294,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.9664354,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"513","last_page":"521"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9836999773979187,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9836999773979187,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13018","display_name":"Seismology and Earthquake Studies","score":0.9404000043869019,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13832","display_name":"Advanced Decision-Making Techniques","score":0.9182999730110168,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/substring","display_name":"Substring","score":0.861572265625},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6314844489097595},{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.5399520397186279},{"id":"https://openalex.org/keywords/extraction","display_name":"Extraction (chemistry)","score":0.4575764834880829},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.41129744052886963},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.32300108671188354},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.10008639097213745},{"id":"https://openalex.org/keywords/chromatography","display_name":"Chromatography","score":0.09241798520088196},{"id":"https://openalex.org/keywords/data-structure","display_name":"Data structure","score":0.07838311791419983},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.06605115532875061}],"concepts":[{"id":"https://openalex.org/C182407805","wikidata":"https://www.wikidata.org/wiki/Q2626534","display_name":"Substring","level":3,"score":0.861572265625},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6314844489097595},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.5399520397186279},{"id":"https://openalex.org/C4725764","wikidata":"https://www.wikidata.org/wiki/Q844704","display_name":"Extraction (chemistry)","level":2,"score":0.4575764834880829},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41129744052886963},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.32300108671188354},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.10008639097213745},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.09241798520088196},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.07838311791419983},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.06605115532875061}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3731120.3744624","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3731120.3744624","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 International ACM SIGIR Conference on Innovative Concepts and Theories in Information Retrieval (ICTIR)","raw_type":"proceedings-article"},{"id":"pmh:oai:HAL:hal-05298876v1","is_oa":false,"landing_page_url":"https://hal.science/hal-05298876","pdf_url":null,"source":{"id":"https://openalex.org/S4406922461","display_name":"SPIRE - Sciences Po Institutional REpository","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"ICTIR '25: International ACM SIGIR Conference on Innovative Concepts and Theories in Information Retrieval, Jul 2025, Padua, Italy. pp.513-521, &#x27E8;10.1145/3731120.3744624&#x27E9;","raw_type":"Conference papers"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W2061141062","https://openalex.org/W3027879771","https://openalex.org/W3095789240","https://openalex.org/W4309674289","https://openalex.org/W4313209338","https://openalex.org/W4320165837","https://openalex.org/W4327644088","https://openalex.org/W4361866031","https://openalex.org/W4384652670","https://openalex.org/W4393152682","https://openalex.org/W4400528326","https://openalex.org/W4403347014","https://openalex.org/W4404534210","https://openalex.org/W4406297511","https://openalex.org/W4406650295","https://openalex.org/W6601899773","https://openalex.org/W6917613312","https://openalex.org/W7035904466"],"related_works":["https://openalex.org/W1583922594","https://openalex.org/W1974038726","https://openalex.org/W2998448420","https://openalex.org/W1598224733","https://openalex.org/W4280502676","https://openalex.org/W2000769876","https://openalex.org/W2112822946","https://openalex.org/W204227468","https://openalex.org/W2157233202","https://openalex.org/W3204019825"],"abstract_inverted_index":{"Hallucination":[0],"occurs":[1],"when":[2],"a":[3,17,78,84],"language":[4],"model":[5],"generates":[6],"plausible":[7],"yet":[8],"nonfactual":[9],"information.":[10],"In":[11],"particular,":[12],"faithfulness":[13],"hallucinations":[14],"(inconsistency":[15],"with":[16],"given":[18],"context)":[19],"cannot":[20],"be":[21],"tolerated":[22],"in":[23,132],"critical":[24],"domains":[25],"such":[26],"as":[27,63],"aircraft":[28,98],"maintenance":[29,99],"due":[30],"to":[31,71,91,111],"the":[32,54,64,72,104,108,115,127],"potentially":[33],"severe":[34],"consequences.":[35],"To":[36],"mitigate":[37],"this":[38],"issue,":[39],"Retrieval":[40],"Augmented":[41],"Generation":[42],"(RAG)":[43],"methods":[44],"have":[45],"been":[46],"introduced.":[47],"These":[48],"approaches":[49],"are":[50,141],"relevant":[51],"for":[52],"reducing":[53],"risks":[55],"of":[56,107,129],"hallucination":[57,123],"but":[58],"do":[59],"not":[60],"eliminate":[61],"them,":[62],"generator":[65],"may":[66],"still":[67],"produce":[68],"content":[69],"unfaithful":[70],"retrieved":[73,89],"context.":[74],"This":[75,125],"paper":[76],"proposes":[77],"novel":[79],"RAG":[80,113],"approach":[81,117],"that":[82],"leverages":[83],"substring":[85],"extraction":[86],"tool":[87],"from":[88],"documents":[90],"minimise":[92],"hallucinations.":[93],"Experiments":[94],"performed":[95],"on":[96],"real":[97],"documentation":[100],"revealed":[101],"that,":[102],"despite":[103],"lower":[105],"accuracy":[106,138],"answers":[109],"compared":[110],"traditional":[112],"methods,":[114],"proposed":[116],"demonstrates":[118],"an":[119],"improved":[120],"control":[121],"over":[122],"risks.":[124],"highlights":[126],"potential":[128],"our":[130],"method":[131],"highly":[133],"technical":[134],"use":[135],"cases":[136],"where":[137],"and":[139],"reliability":[140],"key.":[142]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
