{"id":"https://openalex.org/W7087266786","doi":"https://doi.org/10.18420/inf2025_105","title":"Best Practices in AI and Data Science Models Evaluation","display_name":"Best Practices in AI and Data Science Models Evaluation","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W7087266786","doi":"https://doi.org/10.18420/inf2025_105"},"language":"en","primary_location":{"id":"pmh:oai:pure.leuphana.de:openaire_cris_publications/f31e3aed-334e-45eb-8f9e-b5a36f0778b7","is_oa":true,"landing_page_url":"http://fis.leuphana.de/de/publications/best-practices-in-ai-and-data-science-models-evaluation(f31e3aed-334e-45eb-8f9e-b5a36f0778b7).html","pdf_url":"https://dl.gi.de/bitstreams/9d5b7a50-3901-406f-b9d4-2eb405f5fbcf/download","source":{"id":"https://openalex.org/S4306400489","display_name":"Multilingual Matters (Channel View Publications)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Banerjee, D, Taffa, T A & Usbeck, R 2025, Best Practices in AI and Data Science Models Evaluation. in U Lucke, S Stieglitz, F Uebernickel, A-L Lamprecht & M Klein (eds), INFORMATIK 2025 : The Wide Open - Offenheit von Source bis Science, 16.-19.September 2025 Potsdam. Lecture Notes in Informatics (LNI), Proceedings - Series of the Gesellschaft fur Informatik (GI), Gesellschaft f\u00fcr Informatik e.V., Bonn, pp. 1211-1219. https://doi.org/10.18420/inf2025_105","raw_type":"info:eu-repo/semantics/publishedVersion"},"type":"article","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://dl.gi.de/bitstreams/9d5b7a50-3901-406f-b9d4-2eb405f5fbcf/download","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Banerjee, Debayan","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Banerjee, Debayan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Taffa, Tilahun Abedissa","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Taffa, Tilahun Abedissa","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Usbeck, Ricardo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Usbeck, Ricardo","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.65162442,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T10261","display_name":"Genetic Associations and Epidemiology","score":0.7688999772071838,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10261","display_name":"Genetic Associations and Epidemiology","score":0.7688999772071838,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10222","display_name":"Genomics and Chromatin Dynamics","score":0.06870000064373016,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11213","display_name":"Genomic variations and chromosomal abnormalities","score":0.03370000049471855,"subfield":{"id":"https://openalex.org/subfields/1311","display_name":"Genetics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/best-practice","display_name":"Best practice","score":0.794700026512146},{"id":"https://openalex.org/keywords/trustworthiness","display_name":"Trustworthiness","score":0.6399000287055969},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.517300009727478},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.3625999987125397},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.3483000099658966},{"id":"https://openalex.org/keywords/health-care","display_name":"Health care","score":0.34220001101493835},{"id":"https://openalex.org/keywords/data-quality","display_name":"Data quality","score":0.30709999799728394}],"concepts":[{"id":"https://openalex.org/C184356942","wikidata":"https://www.wikidata.org/wiki/Q830382","display_name":"Best practice","level":2,"score":0.794700026512146},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6413000226020813},{"id":"https://openalex.org/C153701036","wikidata":"https://www.wikidata.org/wiki/Q659974","display_name":"Trustworthiness","level":2,"score":0.6399000287055969},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.6144999861717224},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.517300009727478},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.36550000309944153},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.3625999987125397},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.34929999709129333},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.3483000099658966},{"id":"https://openalex.org/C160735492","wikidata":"https://www.wikidata.org/wiki/Q31207","display_name":"Health care","level":2,"score":0.34220001101493835},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3237000107765198},{"id":"https://openalex.org/C24756922","wikidata":"https://www.wikidata.org/wiki/Q1757694","display_name":"Data quality","level":3,"score":0.30709999799728394},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.3005000054836273},{"id":"https://openalex.org/C2767350","wikidata":"https://www.wikidata.org/wiki/Q6662173","display_name":"Business intelligence","level":2,"score":0.290800005197525},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.2856999933719635},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2752000093460083},{"id":"https://openalex.org/C45804977","wikidata":"https://www.wikidata.org/wiki/Q7239673","display_name":"Predictive modelling","level":2,"score":0.273499995470047},{"id":"https://openalex.org/C157170001","wikidata":"https://www.wikidata.org/wiki/Q4781507","display_name":"Applications of artificial intelligence","level":2,"score":0.26759999990463257},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.258899986743927},{"id":"https://openalex.org/C133462117","wikidata":"https://www.wikidata.org/wiki/Q4929239","display_name":"Data collection","level":2,"score":0.2551000118255615},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.2533999979496002}],"mesh":[],"locations_count":3,"locations":[{"id":"pmh:oai:pure.leuphana.de:openaire_cris_publications/f31e3aed-334e-45eb-8f9e-b5a36f0778b7","is_oa":true,"landing_page_url":"http://fis.leuphana.de/de/publications/best-practices-in-ai-and-data-science-models-evaluation(f31e3aed-334e-45eb-8f9e-b5a36f0778b7).html","pdf_url":"https://dl.gi.de/bitstreams/9d5b7a50-3901-406f-b9d4-2eb405f5fbcf/download","source":{"id":"https://openalex.org/S4306400489","display_name":"Multilingual Matters (Channel View Publications)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Banerjee, D, Taffa, T A & Usbeck, R 2025, Best Practices in AI and Data Science Models Evaluation. in U Lucke, S Stieglitz, F Uebernickel, A-L Lamprecht & M Klein (eds), INFORMATIK 2025 : The Wide Open - Offenheit von Source bis Science, 16.-19.September 2025 Potsdam. Lecture Notes in Informatics (LNI), Proceedings - Series of the Gesellschaft fur Informatik (GI), Gesellschaft f\u00fcr Informatik e.V., Bonn, pp. 1211-1219. https://doi.org/10.18420/inf2025_105","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:pure.leuphana.de:publications/f31e3aed-334e-45eb-8f9e-b5a36f0778b7","is_oa":false,"landing_page_url":"http://fox.leuphana.de/portal/de/publications/best-practices-in-ai-and-data-science-models-evaluation(f31e3aed-334e-45eb-8f9e-b5a36f0778b7).html","pdf_url":null,"source":{"id":"https://openalex.org/S4306400489","display_name":"Multilingual Matters (Channel View Publications)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Banerjee, D, Taffa, T A & Usbeck, R 2025, Best Practices in AI and Data Science Models Evaluation. in U Lucke, S Stieglitz, F Uebernickel, A-L Lamprecht & M Klein (eds), INFORMATIK 2025 : The Wide Open - Offenheit von Source bis Science, 16.-19.September 2025 Potsdam. Lecture Notes in Informatics (LNI), Proceedings - Series of the Gesellschaft fur Informatik (GI), Gesellschaft f\u00fcr Informatik e.V., Bonn, pp. 1211-1219. https://doi.org/10.18420/inf2025_105","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"doi:10.18420/inf2025_105","is_oa":true,"landing_page_url":"https://doi.org/10.18420/inf2025_105","pdf_url":null,"source":{"id":"https://openalex.org/S7407052918","display_name":"Gesellschaft f\u00fcr Informatik (GI)","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"pmh:oai:pure.leuphana.de:openaire_cris_publications/f31e3aed-334e-45eb-8f9e-b5a36f0778b7","is_oa":true,"landing_page_url":"http://fis.leuphana.de/de/publications/best-practices-in-ai-and-data-science-models-evaluation(f31e3aed-334e-45eb-8f9e-b5a36f0778b7).html","pdf_url":"https://dl.gi.de/bitstreams/9d5b7a50-3901-406f-b9d4-2eb405f5fbcf/download","source":{"id":"https://openalex.org/S4306400489","display_name":"Multilingual Matters (Channel View Publications)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Banerjee, D, Taffa, T A & Usbeck, R 2025, Best Practices in AI and Data Science Models Evaluation. in U Lucke, S Stieglitz, F Uebernickel, A-L Lamprecht & M Klein (eds), INFORMATIK 2025 : The Wide Open - Offenheit von Source bis Science, 16.-19.September 2025 Potsdam. Lecture Notes in Informatics (LNI), Proceedings - Series of the Gesellschaft fur Informatik (GI), Gesellschaft f\u00fcr Informatik e.V., Bonn, pp. 1211-1219. https://doi.org/10.18420/inf2025_105","raw_type":"info:eu-repo/semantics/publishedVersion"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2761004381","display_name":null,"funder_award_id":"460234259","funder_id":"https://openalex.org/F4320320879","funder_display_name":"Deutsche Forschungsgemeinschaft"},{"id":"https://openalex.org/G6052429835","display_name":null,"funder_award_id":"(DFG)","funder_id":"https://openalex.org/F4320320879","funder_display_name":"Deutsche Forschungsgemeinschaft"}],"funders":[{"id":"https://openalex.org/F4320320879","display_name":"Deutsche Forschungsgemeinschaft","ror":"https://ror.org/018mejw64"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W7087266786.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Evaluating":[0],"Artificial":[1],"Intelligence":[2],"(AI)":[3],"and":[4,15,53,62,86,93,111],"data":[5,55],"science":[6],"models":[7,76],"is":[8],"crucial":[9],"to":[10,103],"ensure":[11],"their":[12],"reliability,":[13],"fairness,":[14],"applicability":[16],"in":[17,67],"real-world":[18],"scenarios.":[19],"This":[20],"paper":[21],"highlights":[22],"best":[23],"practices":[24,92],"for":[25,51],"model":[26],"evaluation,":[27],"emphasizing":[28],"the":[29,98],"importance":[30],"of":[31],"selecting":[32],"appropriate":[33],"metrics":[34],"aligned":[35],"with":[36],"business":[37],"or":[38,72,80],"research":[39],"goals.":[40],"Key":[41],"considerations":[42],"include":[43],"using":[44],"robust":[45],"validation":[46],"strategies":[47],"(e.g.,":[48],"cross-validation),":[49],"monitoring":[50],"overfitting,":[52],"ensuring":[54],"splits":[56],"preserve":[57],"class":[58],"distributions.":[59],"Fairness,":[60],"interpretability,":[61],"reproducibility":[63],"are":[64],"essential,":[65],"particularly":[66],"high-stakes":[68],"domains":[69],"like":[70],"healthcare":[71],"finance.":[73],"Additionally,":[74],"evaluating":[75],"across":[77],"multiple":[78],"datasets":[79],"demographic":[81],"subgroups":[82],"helps":[83],"uncover":[84],"biases":[85],"improve":[87],"generalizability.":[88],"Adopting":[89],"standardized":[90],"reporting":[91],"open-source":[94],"benchmarks":[95],"further":[96],"strengthens":[97],"evaluation":[99],"process.":[100],"By":[101],"adhering":[102],"these":[104],"practices,":[105],"practitioners":[106],"can":[107],"build":[108],"more":[109],"trustworthy":[110],"effective":[112],"AI":[113],"systems":[114]},"counts_by_year":[],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-11T00:00:00"}
