{"id":"https://openalex.org/W4408605330","doi":"https://doi.org/10.1088/2632-2153/adc2d6","title":"ChemLit-QA: a human evaluated dataset for chemistry RAG tasks","display_name":"ChemLit-QA: a human evaluated dataset for chemistry RAG tasks","publication_year":2025,"publication_date":"2025-03-19","ids":{"openalex":"https://openalex.org/W4408605330","doi":"https://doi.org/10.1088/2632-2153/adc2d6"},"language":"en","primary_location":{"id":"doi:10.1088/2632-2153/adc2d6","is_oa":true,"landing_page_url":"https://doi.org/10.1088/2632-2153/adc2d6","pdf_url":null,"source":{"id":"https://openalex.org/S4210200687","display_name":"Machine Learning Science and Technology","issn_l":"2632-2153","issn":["2632-2153"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320083","host_organization_name":"IOP Publishing","host_organization_lineage":["https://openalex.org/P4310320083","https://openalex.org/P4310311669"],"host_organization_lineage_names":["IOP Publishing","Institute of Physics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning: Science and Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1088/2632-2153/adc2d6","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5012917895","display_name":"Geemi P. Wellawatte","orcid":"https://orcid.org/0000-0002-3772-6927"},"institutions":[{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Geemi P Wellawatte","raw_affiliation_strings":["Institute of Chemical Sciences and Engineering, Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Laboratory of Artificial Chemical Intelligence (LIAC), Lausanne, Switzerland"],"raw_orcid":"https://orcid.org/0000-0002-3772-6927","affiliations":[{"raw_affiliation_string":"Institute of Chemical Sciences and Engineering, Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Laboratory of Artificial Chemical Intelligence (LIAC), Lausanne, Switzerland","institution_ids":["https://openalex.org/I5124864"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053485585","display_name":"Huixuan Guo","orcid":"https://orcid.org/0000-0002-2289-8945"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]},{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH","SG"],"is_corresponding":false,"raw_author_name":"Huixuan Guo","raw_affiliation_strings":["Department of Chemical and Biomolecular Engineering, Nanyang Technological University (NTU), Singapore, Singapore","Institute of Chemical Sciences and Engineering, Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Laboratory of Artificial Chemical Intelligence (LIAC), Lausanne, Switzerland","National Centre of Competence in Research (NCCR) Catalysis, EPFL, Lausanne, Switzerland"],"raw_orcid":"https://orcid.org/0000-0002-2289-8945","affiliations":[{"raw_affiliation_string":"Department of Chemical and Biomolecular Engineering, Nanyang Technological University (NTU), Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]},{"raw_affiliation_string":"Institute of Chemical Sciences and Engineering, Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Laboratory of Artificial Chemical Intelligence (LIAC), Lausanne, Switzerland","institution_ids":["https://openalex.org/I5124864"]},{"raw_affiliation_string":"National Centre of Competence in Research (NCCR) Catalysis, EPFL, Lausanne, Switzerland","institution_ids":["https://openalex.org/I5124864"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114987474","display_name":"Magdalena Lederbauer","orcid":"https://orcid.org/0009-0008-0665-1839"},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]},{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Magdalena Lederbauer","raw_affiliation_strings":["Department of Chemistry and Applied Biosciences, ETH, Zurich, Switzerland","Institute of Chemical Sciences and Engineering, Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Laboratory of Artificial Chemical Intelligence (LIAC), Lausanne, Switzerland","National Centre of Competence in Research (NCCR) Catalysis, EPFL, Lausanne, Switzerland"],"raw_orcid":"https://orcid.org/0009-0008-0665-1839","affiliations":[{"raw_affiliation_string":"Department of Chemistry and Applied Biosciences, ETH, Zurich, Switzerland","institution_ids":["https://openalex.org/I35440088"]},{"raw_affiliation_string":"Institute of Chemical Sciences and Engineering, Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Laboratory of Artificial Chemical Intelligence (LIAC), Lausanne, Switzerland","institution_ids":["https://openalex.org/I5124864"]},{"raw_affiliation_string":"National Centre of Competence in Research (NCCR) Catalysis, EPFL, Lausanne, Switzerland","institution_ids":["https://openalex.org/I5124864"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013456318","display_name":"Anna S. Borisova","orcid":"https://orcid.org/0000-0002-3414-9888"},"institutions":[{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Anna Borisova","raw_affiliation_strings":["Institute of Chemical Sciences and Engineering, Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Laboratory of Artificial Chemical Intelligence (LIAC), Lausanne, Switzerland","National Centre of Competence in Research (NCCR) Catalysis, EPFL, Lausanne, Switzerland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Chemical Sciences and Engineering, Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Laboratory of Artificial Chemical Intelligence (LIAC), Lausanne, Switzerland","institution_ids":["https://openalex.org/I5124864"]},{"raw_affiliation_string":"National Centre of Competence in Research (NCCR) Catalysis, EPFL, Lausanne, Switzerland","institution_ids":["https://openalex.org/I5124864"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046339281","display_name":"Matthew J. Hart","orcid":"https://orcid.org/0000-0002-2683-480X"},"institutions":[{"id":"https://openalex.org/I1333535994","display_name":"University of North Carolina Health Care","ror":"https://ror.org/00qz24g20","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I1333535994"]},{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH","US"],"is_corresponding":false,"raw_author_name":"Matthew Hart","raw_affiliation_strings":["Department of Applied Physical Sciences, UNC, Chapel Hill, NC, United States of America","Institute of Chemical Sciences and Engineering, Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Laboratory of Artificial Chemical Intelligence (LIAC), Lausanne, Switzerland","National Centre of Competence in Research (NCCR) Catalysis, EPFL, Lausanne, Switzerland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Applied Physical Sciences, UNC, Chapel Hill, NC, United States of America","institution_ids":["https://openalex.org/I1333535994"]},{"raw_affiliation_string":"Institute of Chemical Sciences and Engineering, Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Laboratory of Artificial Chemical Intelligence (LIAC), Lausanne, Switzerland","institution_ids":["https://openalex.org/I5124864"]},{"raw_affiliation_string":"National Centre of Competence in Research (NCCR) Catalysis, EPFL, Lausanne, Switzerland","institution_ids":["https://openalex.org/I5124864"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116695426","display_name":"Marta Brucka","orcid":null},"institutions":[{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Marta Brucka","raw_affiliation_strings":["Institute of Chemical Sciences and Engineering, Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Laboratory of Artificial Chemical Intelligence (LIAC), Lausanne, Switzerland","National Centre of Competence in Research (NCCR) Catalysis, EPFL, Lausanne, Switzerland"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Chemical Sciences and Engineering, Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Laboratory of Artificial Chemical Intelligence (LIAC), Lausanne, Switzerland","institution_ids":["https://openalex.org/I5124864"]},{"raw_affiliation_string":"National Centre of Competence in Research (NCCR) Catalysis, EPFL, Lausanne, Switzerland","institution_ids":["https://openalex.org/I5124864"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5028051805","display_name":"Philippe Schwaller","orcid":"https://orcid.org/0000-0003-3046-6576"},"institutions":[{"id":"https://openalex.org/I5124864","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I5124864"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Philippe Schwaller","raw_affiliation_strings":["Institute of Chemical Sciences and Engineering, Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Laboratory of Artificial Chemical Intelligence (LIAC), Lausanne, Switzerland","National Centre of Competence in Research (NCCR) Catalysis, EPFL, Lausanne, Switzerland"],"raw_orcid":"https://orcid.org/0000-0003-3046-6576","affiliations":[{"raw_affiliation_string":"Institute of Chemical Sciences and Engineering, Ecole Polytechnique F\u00e9d\u00e9rale de Lausanne (EPFL), Laboratory of Artificial Chemical Intelligence (LIAC), Lausanne, Switzerland","institution_ids":["https://openalex.org/I5124864"]},{"raw_affiliation_string":"National Centre of Competence in Research (NCCR) Catalysis, EPFL, Lausanne, Switzerland","institution_ids":["https://openalex.org/I5124864"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":1600,"currency":"GBP","value_usd":1962},"apc_paid":{"value":1600,"currency":"GBP","value_usd":1962},"fwci":1.1519,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.76016691,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":"6","issue":"2","first_page":"020601","last_page":"020601"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.8476999998092651,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.8476999998092651,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12327","display_name":"Various Chemistry Research Topics","score":0.8403000235557556,"subfield":{"id":"https://openalex.org/subfields/1606","display_name":"Physical and Theoretical Chemistry"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10211","display_name":"Computational Drug Discovery Methods","score":0.7426999807357788,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4537633955478668},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.39736688137054443},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3698410391807556},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.33632680773735046},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.32709813117980957},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.16447925567626953}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4537633955478668},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.39736688137054443},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3698410391807556},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.33632680773735046},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.32709813117980957},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.16447925567626953}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1088/2632-2153/adc2d6","is_oa":true,"landing_page_url":"https://doi.org/10.1088/2632-2153/adc2d6","pdf_url":null,"source":{"id":"https://openalex.org/S4210200687","display_name":"Machine Learning Science and Technology","issn_l":"2632-2153","issn":["2632-2153"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320083","host_organization_name":"IOP Publishing","host_organization_lineage":["https://openalex.org/P4310320083","https://openalex.org/P4310311669"],"host_organization_lineage_names":["IOP Publishing","Institute of Physics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning: Science and Technology","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:03423ff5d36440c88c2860b621f84fc8","is_oa":true,"landing_page_url":"https://doaj.org/article/03423ff5d36440c88c2860b621f84fc8","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Machine Learning: Science and Technology, Vol 6, Iss 2, p 020601 (2025)","raw_type":"article"},{"id":"pmh:oai:dr.ntu.edu.sg:10356/207123","is_oa":false,"landing_page_url":"https://hdl.handle.net/10356/207123","pdf_url":null,"source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Journal Article"}],"best_oa_location":{"id":"doi:10.1088/2632-2153/adc2d6","is_oa":true,"landing_page_url":"https://doi.org/10.1088/2632-2153/adc2d6","pdf_url":null,"source":{"id":"https://openalex.org/S4210200687","display_name":"Machine Learning Science and Technology","issn_l":"2632-2153","issn":["2632-2153"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320083","host_organization_name":"IOP Publishing","host_organization_lineage":["https://openalex.org/P4310320083","https://openalex.org/P4310311669"],"host_organization_lineage_names":["IOP Publishing","Institute of Physics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning: Science and Technology","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2159126771","display_name":null,"funder_award_id":"225147","funder_id":"https://openalex.org/F8269005443","funder_display_name":"NCCR Catalysis"}],"funders":[{"id":"https://openalex.org/F4320320915","display_name":"\u00c9cole Polytechnique F\u00e9d\u00e9rale de Lausanne","ror":"https://ror.org/02s376052"},{"id":"https://openalex.org/F8269005443","display_name":"NCCR Catalysis","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W2889787757","https://openalex.org/W2963026768","https://openalex.org/W2963123047","https://openalex.org/W2963748441","https://openalex.org/W3034383590","https://openalex.org/W3155807546","https://openalex.org/W3172205429","https://openalex.org/W4285999563","https://openalex.org/W4309674289","https://openalex.org/W4327550249","https://openalex.org/W4365211638","https://openalex.org/W4380995299","https://openalex.org/W4383346782","https://openalex.org/W4389761608","https://openalex.org/W4389991792","https://openalex.org/W4391221150","https://openalex.org/W4391561379","https://openalex.org/W4391846075","https://openalex.org/W4392822465","https://openalex.org/W4396723768","https://openalex.org/W4399442007","https://openalex.org/W4399803256","https://openalex.org/W4401248262","https://openalex.org/W4403420914","https://openalex.org/W4406779522","https://openalex.org/W6767102903","https://openalex.org/W6777615688","https://openalex.org/W6778883912","https://openalex.org/W6794800773","https://openalex.org/W6809646742","https://openalex.org/W6838540236","https://openalex.org/W6853859572","https://openalex.org/W6854866820","https://openalex.org/W6855664720","https://openalex.org/W6856802482","https://openalex.org/W6858023062","https://openalex.org/W6859201984","https://openalex.org/W6861152682","https://openalex.org/W6861717473","https://openalex.org/W6861740999","https://openalex.org/W6862478885","https://openalex.org/W6863620578","https://openalex.org/W6865177968","https://openalex.org/W6866540064","https://openalex.org/W6869570532","https://openalex.org/W6872286008","https://openalex.org/W6877457025"],"related_works":["https://openalex.org/W4387497383","https://openalex.org/W2948807893","https://openalex.org/W2899084033","https://openalex.org/W2778153218","https://openalex.org/W2748952813","https://openalex.org/W1531601525","https://openalex.org/W4391375266","https://openalex.org/W2078814861","https://openalex.org/W2527526854","https://openalex.org/W1976181487"],"abstract_inverted_index":{"Abstract":[0],"Retrieval-Augmented":[1],"Generation":[2],"(RAG)":[3],"is":[4,22,37],"a":[5,83,97,119],"widely":[6],"used":[7],"strategy":[8],"in":[9,26,47,61],"Large-Language":[10],"Models":[11],"(LLMs)":[12],"to":[13,64,91],"extrapolate":[14],"beyond":[15],"the":[16,48,65,113,159],"inherent":[17],"pre-trained":[18],"knowledge.":[19],"Hence,":[20],"RAG":[21,35],"crucial":[23],"when":[24,76],"working":[25],"data-sparse":[27],"fields":[28],"such":[29],"as":[30],"Chemistry.":[31],"The":[32],"evaluation":[33,133],"of":[34,50,68,118],"systems":[36],"commonly":[38],"conducted":[39],"using":[40,122],"specialized":[41],"datasets.":[42],"However,":[43],"existing":[44],"datasets,":[45],"typically":[46],"form":[49],"scientific":[51,92],"Question-Answer-Context":[52],"(QAC)":[53],"triplets":[54],"or":[55,71],"QA":[56],"pairs,":[57],"are":[58],"often":[59],"limited":[60],"size":[62],"due":[63],"labor-intensive":[66],"nature":[67],"manual":[69],"curation":[70],"require":[72],"further":[73],"quality":[74],"assessment":[75],"generated":[77],"through":[78],"automated":[79,124],"processes.":[80],"This":[81],"highlights":[82],"critical":[84],"need":[85],"for":[86,108,155],"large,":[87],"high-quality":[88],"datasets":[89],"tailored":[90],"applications.":[93],"We":[94],"introduce":[95],"ChemLit-QA,":[96],"comprehensive,":[98],"expert-validated,":[99],"open-source":[100],"dataset":[101,121,161],"comprising":[102],"over":[103],"1,000":[104],"entries":[105],"specifically":[106],"designed":[107],"chemistry.":[109],"Our":[110],"approach":[111],"involves":[112],"initial":[114],"generation":[115],"and":[116,148,165],"filtering":[117],"QAC":[120],"an":[123],"framework":[125],"based":[126],"on":[127,145,151,162],"GPT-4":[128],"Turbo,":[129],"followed":[130],"by":[131,134],"rigorous":[132],"chemistry":[135],"experts.":[136],"Additionally,":[137],"we":[138],"provide":[139],"two":[140],"supplementary":[141],"datasets:":[142],"ChemLit-QA-neg":[143],"focused":[144,150],"negative":[146],"data,":[147],"ChemLit-QA-multi":[149],"multihop":[152],"reasoning":[153],"tasks":[154],"LLMs,":[156],"which":[157],"complement":[158],"main":[160],"hallucination":[163],"detection":[164],"more":[166],"reasoning-intensive":[167],"tasks.":[168]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
