{"id":"https://openalex.org/W4403487010","doi":"https://doi.org/10.3233/faia240837","title":"RETRO-LI: Small-Scale Retrieval Augmented Generation Supporting Noisy Similarity Searches and Domain Shift Generalization","display_name":"RETRO-LI: Small-Scale Retrieval Augmented Generation Supporting Noisy Similarity Searches and Domain Shift Generalization","publication_year":2024,"publication_date":"2024-10-16","ids":{"openalex":"https://openalex.org/W4403487010","doi":"https://doi.org/10.3233/faia240837"},"language":"en","primary_location":{"id":"doi:10.3233/faia240837","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia240837","pdf_url":"https://ebooks.iospress.nl/pdf/doi/10.3233/FAIA240837","source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://ebooks.iospress.nl/pdf/doi/10.3233/FAIA240837","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5093073513","display_name":"Gentiana Rashiti","orcid":null},"institutions":[{"id":"https://openalex.org/I4210126328","display_name":"IBM Research - Zurich","ror":"https://ror.org/02js37d36","country_code":"CH","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115","https://openalex.org/I4210126328"]},{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":true,"raw_author_name":"Gentiana Rashiti","raw_affiliation_strings":["ETH Z\u00fcrich","IBM Research \u2013 Zurich"],"affiliations":[{"raw_affiliation_string":"ETH Z\u00fcrich","institution_ids":["https://openalex.org/I35440088"]},{"raw_affiliation_string":"IBM Research \u2013 Zurich","institution_ids":["https://openalex.org/I4210126328"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043163538","display_name":"Geethan Karunaratne","orcid":"https://orcid.org/0000-0002-0805-4789"},"institutions":[{"id":"https://openalex.org/I4210126328","display_name":"IBM Research - Zurich","ror":"https://ror.org/02js37d36","country_code":"CH","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115","https://openalex.org/I4210126328"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Geethan Karunaratne","raw_affiliation_strings":["IBM Research \u2013 Zurich"],"affiliations":[{"raw_affiliation_string":"IBM Research \u2013 Zurich","institution_ids":["https://openalex.org/I4210126328"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002316432","display_name":"Mrinmaya Sachan","orcid":"https://orcid.org/0000-0001-8787-8681"},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Mrinmaya Sachan","raw_affiliation_strings":["ETH Z\u00fcrich"],"affiliations":[{"raw_affiliation_string":"ETH Z\u00fcrich","institution_ids":["https://openalex.org/I35440088"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017236774","display_name":"Abu Sebastian","orcid":"https://orcid.org/0000-0001-5603-5243"},"institutions":[{"id":"https://openalex.org/I4210126328","display_name":"IBM Research - Zurich","ror":"https://ror.org/02js37d36","country_code":"CH","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115","https://openalex.org/I4210126328"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Abu Sebastian","raw_affiliation_strings":["IBM Research \u2013 Zurich"],"affiliations":[{"raw_affiliation_string":"IBM Research \u2013 Zurich","institution_ids":["https://openalex.org/I4210126328"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050167359","display_name":"Abbas Rahimi","orcid":"https://orcid.org/0000-0003-3141-4970"},"institutions":[{"id":"https://openalex.org/I4210126328","display_name":"IBM Research - Zurich","ror":"https://ror.org/02js37d36","country_code":"CH","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115","https://openalex.org/I4210126328"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Abbas Rahimi","raw_affiliation_strings":["IBM Research \u2013 Zurich"],"affiliations":[{"raw_affiliation_string":"IBM Research \u2013 Zurich","institution_ids":["https://openalex.org/I4210126328"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5093073513"],"corresponding_institution_ids":["https://openalex.org/I35440088","https://openalex.org/I4210126328"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.38605781,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.989300012588501,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.989300012588501,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9833999872207642,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9666000008583069,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.7190356254577637},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.6480222940444946},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.5836210250854492},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5545873045921326},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5334976315498352},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.44228360056877136},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.42573416233062744},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2223457396030426},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.1670810878276825},{"id":"https://openalex.org/keywords/cartography","display_name":"Cartography","score":0.07927876710891724}],"concepts":[{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.7190356254577637},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.6480222940444946},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.5836210250854492},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5545873045921326},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5334976315498352},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.44228360056877136},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42573416233062744},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2223457396030426},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.1670810878276825},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.07927876710891724},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3233/faia240837","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia240837","pdf_url":"https://ebooks.iospress.nl/pdf/doi/10.3233/FAIA240837","source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},{"id":"pmh:oai:arXiv.org:2410.00004","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2410.00004","pdf_url":"https://arxiv.org/pdf/2410.00004","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"doi:10.3233/faia240837","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia240837","pdf_url":"https://ebooks.iospress.nl/pdf/doi/10.3233/FAIA240837","source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.7300000190734863,"display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G7880511466","display_name":null,"funder_award_id":"200800","funder_id":"https://openalex.org/F4320320924","funder_display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung"},{"id":"https://openalex.org/G8079057867","display_name":"Etudes en vue de la synth\u00e8se totale de la Roflamy- coine.","funder_award_id":"20080","funder_id":"https://openalex.org/F4320320924","funder_display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320320924","display_name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung","ror":"https://ror.org/00yjd3n13"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4403487010.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3162204513","https://openalex.org/W2371138613","https://openalex.org/W2048963458","https://openalex.org/W43109613","https://openalex.org/W2359952343","https://openalex.org/W2239445980","https://openalex.org/W2080152487","https://openalex.org/W3083152911","https://openalex.org/W2967006609","https://openalex.org/W2327130486"],"abstract_inverted_index":{"The":[0],"retrieval":[1,39],"augmented":[2],"generation":[3],"(RAG)":[4],"system":[5],"such":[6],"as":[7],"RETRO":[8],"has":[9],"been":[10],"shown":[11],"to":[12,82],"improve":[13],"language":[14],"modeling":[15],"capabilities":[16],"and":[17,20,53,103],"reduce":[18],"toxicity":[19],"hallucinations":[21],"by":[22,69],"retrieving":[23,137],"from":[24],"a":[25,44,59,71,80,108],"database":[26],"of":[27,32],"non-parametric":[28,63,84,118],"memory":[29,85,119],"containing":[30],"trillions":[31],"entries.":[33],"We":[34,76,112],"introduce":[35],"RETRO-LI":[36],"that":[37,115],"shows":[38],"can":[40,66,120],"also":[41,113],"help":[42],"using":[43,70],"small":[45],"scale":[46],"database,":[47],"but":[48],"it":[49,90,104],"demands":[50],"more":[51],"accurate":[52],"better":[54],"neighbors":[55],"when":[56,94,107],"searching":[57],"in":[58,136],"smaller":[60],"hence":[61],"sparser":[62],"memory.":[64],"This":[65],"be":[67,122],"met":[68],"proper":[72],"semantic":[73],"similarity":[74],"search.":[75],"further":[77],"propose":[78],"adding":[79],"regularization":[81],"the":[83,87,95,116],"for":[86],"first":[88],"time:":[89],"significantly":[91],"reduces":[92],"perplexity":[93],"neighbor":[96],"search":[97,131],"operations":[98],"are":[99],"noisy":[100],"during":[101],"inference,":[102],"improves":[105],"generalization":[106],"domain":[109],"shift":[110],"occurs.":[111],"show":[114],"RETRO-LI\u2019s":[117],"potentially":[121],"implemented":[123],"on":[124],"analog":[125],"in-memory":[126],"computing":[127],"hardware,":[128],"exhibiting":[129],"O(1)":[130],"time":[132],"while":[133],"causing":[134],"noise":[135],"neighbors,":[138],"with":[139],"minimal":[140],"(&lt;1%)":[141],"performance":[142],"loss.":[143],"Our":[144],"code":[145],"is":[146],"available":[147],"at:":[148],"https://github.com/IBM/Retrieval-Enhanced-Transformer-Little":[149]},"counts_by_year":[],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
