{"id":"https://openalex.org/W4408403680","doi":"https://doi.org/10.1145/3677389.3702522","title":"Exploring Efficient Optimization Techniques in Online Retrieval-Augmented Generation Application","display_name":"Exploring Efficient Optimization Techniques in Online Retrieval-Augmented Generation Application","publication_year":2024,"publication_date":"2024-12-16","ids":{"openalex":"https://openalex.org/W4408403680","doi":"https://doi.org/10.1145/3677389.3702522"},"language":"en","primary_location":{"id":"doi:10.1145/3677389.3702522","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3677389.3702522","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 24th ACM/IEEE Joint Conference on Digital Libraries","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100722415","display_name":"Yining Zhang","orcid":"https://orcid.org/0009-0006-2107-5855"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yining Zhang","raw_affiliation_strings":["Peking University, Beijing, China","School of Computer Science, Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0006-2107-5855","affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"School of Computer Science, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yinan Peng","orcid":"https://orcid.org/0009-0008-2653-2992"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yinan Peng","raw_affiliation_strings":["School of Computer Science, Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0008-2653-2992","affiliations":[{"raw_affiliation_string":"School of Computer Science, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057927581","display_name":"C.W. Tu","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chengying Tu","raw_affiliation_strings":["School of Computer Science, Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0006-0604-8816","affiliations":[{"raw_affiliation_string":"School of Computer Science, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zherui Zhang","orcid":"https://orcid.org/0009-0008-0150-715X"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zherui Zhang","raw_affiliation_strings":["School of Computer Science, Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0008-0150-715X","affiliations":[{"raw_affiliation_string":"School of Computer Science, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111726041","display_name":"Hongfei Yan","orcid":"https://orcid.org/0000-0001-5914-8585"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongfei Yan","raw_affiliation_strings":["State Key Laboratory of Multimedia Information Processing, School of Computer Science, Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-5914-8585","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Multimedia Information Processing, School of Computer Science, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113913281","display_name":"Chong Chen","orcid":"https://orcid.org/0000-0002-9704-1575"},"institutions":[{"id":"https://openalex.org/I4210105365","display_name":"Qujing Normal University","ror":"https://ror.org/02ad7ap24","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210105365"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chong Chen","raw_affiliation_strings":["Bejing Normal University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-9704-1575","affiliations":[{"raw_affiliation_string":"Bejing Normal University, Beijing, China","institution_ids":["https://openalex.org/I4210105365"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Hao Ma","orcid":"https://orcid.org/0009-0007-8075-9584"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hao Ma","raw_affiliation_strings":["Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0007-8075-9584","affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100516224","display_name":"Jia Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jia Yang","raw_affiliation_strings":["Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0008-1216-2871","affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yan Zhang","orcid":"https://orcid.org/0009-0008-8103-7978"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yan Zhang","raw_affiliation_strings":["Peking University, Beijing, China","School of Computer Science, Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0008-8103-7978","affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"School of Computer Science, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5029343996","display_name":"Rikun Liao","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rikun Liao","raw_affiliation_strings":["Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0000-5403-2874","affiliations":[{"raw_affiliation_string":"Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":10,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.2187,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.56137338,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"11"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9850999712944031,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9850999712944031,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9623000025749207,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9556000232696533,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7942221164703369},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.44915810227394104},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3442688286304474}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7942221164703369},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.44915810227394104},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3442688286304474}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3677389.3702522","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3677389.3702522","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 24th ACM/IEEE Joint Conference on Digital Libraries","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":2,"referenced_works":["https://openalex.org/W2963469388","https://openalex.org/W3027879771"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Recent":[0],"advances":[1],"in":[2,47,85,102,111],"large":[3],"language":[4],"models":[5],"(LLM)":[6],"have":[7,52],"brought":[8],"an":[9],"explosive":[10],"growth":[11],"to":[12,23,58,90,180],"chat-bot":[13],"applications.":[14,195],"Among":[15],"them,":[16],"retrieval-augmented":[17],"generation,":[18],"which":[19,69,134],"provides":[20],"extra":[21,66],"context":[22],"make":[24],"LLM":[25,67,123,194],"capable":[26],"of":[27,39,56,63,105,155],"answering":[28],"out-of-domain":[29],"questions":[30],"is":[31,70],"becoming":[32],"a":[33,54,99,106,118],"popular":[34],"method.":[35],"However,":[36],"naive":[37],"implementation":[38],"RAG":[40,86],"usually":[41],"cannot":[42],"reach":[43],"ideal":[44],"answer":[45,140,182],"quality":[46,92],"complicated":[48],"real-world":[49,193],"scenarios.":[50],"Researchers":[51],"proposed":[53],"number":[55],"methods":[57],"improve":[59,88],"RAG,":[60],"but":[61],"many":[62],"them":[64],"involves":[65],"calls":[68],"too":[71],"time-consuming":[72],"for":[73,124,163,190],"online":[74],"application.":[75],"In":[76],"this":[77],"paper,":[78],"we":[79],"explored":[80],"practical":[81],"techniques":[82],"and":[83,142,157,168,186],"designs":[84],"that":[87],"answers":[89],"user-satisfying":[91],"while":[93],"keeping":[94],"the":[95,103,138,144,153,160],"response":[96],"latency":[97],"at":[98],"moderate":[100],"level":[101],"scenario":[104],"research":[107],"data":[108],"QA":[109],"application":[110],"university.":[112],"Our":[113,184],"main":[114],"findings":[115],"include":[116],"introducing":[117],"relevance":[119],"judge":[120],"with":[121],"small-scale":[122],"retrieved":[125],"documents":[126],"can":[127,135,151],"effectively":[128],"filter":[129],"out":[130],"less":[131],"relevant":[132],"ones,":[133],"otherwise":[136],"disrupt":[137],"generated":[139],"greatly,":[141],"decomposing":[143],"generation":[145],"task":[146],"into":[147],"multiple":[148],"independent":[149],"sub-tasks":[150],"reduce":[152],"chance":[154],"hallucination":[156],"also":[158],"accelerates":[159],"generation.":[161],"As":[162],"model":[164],"performance,":[165],"prompt":[166],"engineering":[167],"fine-tuning":[169],"(through":[170],"learning":[171],"from":[172],"strong":[173],"LLM)":[174],"are":[175],"effective":[176],"yet":[177],"simple":[178],"ways":[179],"enhance":[181],"quality.":[183],"results":[185],"experience":[187],"provide":[188],"insights":[189],"building":[191],"future":[192]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
