{"id":"https://openalex.org/W2475602767","doi":"https://doi.org/10.25080/majora-8b375195-004","title":"SkData: Data Sets and Algorithm Evaluation Protocols in Python","display_name":"SkData: Data Sets and Algorithm Evaluation Protocols in Python","publication_year":2013,"publication_date":"2013-01-01","ids":{"openalex":"https://openalex.org/W2475602767","doi":"https://doi.org/10.25080/majora-8b375195-004","mag":"2475602767"},"language":"en","primary_location":{"id":"doi:10.25080/majora-8b375195-004","is_oa":true,"landing_page_url":"https://doi.org/10.25080/majora-8b375195-004","pdf_url":"http://conference.scipy.org/proceedings/scipy2013/pdfs/bergstra_skdata.pdf","source":{"id":"https://openalex.org/S4220651651","display_name":"Proceedings of the Python in Science Conferences","issn_l":"2575-9752","issn":["2575-9752"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Python in Science Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"http://conference.scipy.org/proceedings/scipy2013/pdfs/bergstra_skdata.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057264590","display_name":"James Bergstra","orcid":null},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"James Bergstra","raw_affiliation_strings":["University of Waterloo"],"affiliations":[{"raw_affiliation_string":"University of Waterloo","institution_ids":["https://openalex.org/I151746483"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111928952","display_name":"Nicolas Pinto","orcid":null},"institutions":[{"id":"https://openalex.org/I136199984","display_name":"Harvard University","ror":"https://ror.org/03vek6s52","country_code":"US","type":"education","lineage":["https://openalex.org/I136199984"]},{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]},{"id":"https://openalex.org/I2801851002","display_name":"Harvard University Press","ror":"https://ror.org/006v7bf86","country_code":"US","type":"other","lineage":["https://openalex.org/I136199984","https://openalex.org/I2801851002"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nicolas Pinto","raw_affiliation_strings":["Massachusetts Institute of Technology  Harvard University","Massachusetts Institute of Technology \u00b6 Harvard University"],"affiliations":[{"raw_affiliation_string":"Massachusetts Institute of Technology  Harvard University","institution_ids":["https://openalex.org/I2801851002","https://openalex.org/I63966007"]},{"raw_affiliation_string":"Massachusetts Institute of Technology \u00b6 Harvard University","institution_ids":["https://openalex.org/I136199984","https://openalex.org/I63966007"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101624980","display_name":"D. J. Cox","orcid":"https://orcid.org/0009-0008-1944-4337"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"David Cox","raw_affiliation_strings":["http://www.youtube.com/watch?v=u5amehIiImo"],"affiliations":[{"raw_affiliation_string":"http://www.youtube.com/watch?v=u5amehIiImo","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5057264590"],"corresponding_institution_ids":["https://openalex.org/I151746483"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":93,"citation_normalized_percentile":{"value":0.24865662,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"20","last_page":"26"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13650","display_name":"Computational Physics and Python Applications","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9890000224113464,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/python","display_name":"Python (programming language)","score":0.8291298151016235},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8280967473983765},{"id":"https://openalex.org/keywords/upload","display_name":"Upload","score":0.6862055659294128},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.6337363719940186},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6145622730255127},{"id":"https://openalex.org/keywords/scripting-language","display_name":"Scripting language","score":0.5783193111419678},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.48115694522857666},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4323316216468811},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4320456087589264},{"id":"https://openalex.org/keywords/data-set","display_name":"Data set","score":0.4125773012638092},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.3998304307460785},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.35384148359298706},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3291638493537903},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3130646347999573},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.1505376398563385}],"concepts":[{"id":"https://openalex.org/C519991488","wikidata":"https://www.wikidata.org/wiki/Q28865","display_name":"Python (programming language)","level":2,"score":0.8291298151016235},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8280967473983765},{"id":"https://openalex.org/C71901391","wikidata":"https://www.wikidata.org/wiki/Q7126699","display_name":"Upload","level":2,"score":0.6862055659294128},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.6337363719940186},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6145622730255127},{"id":"https://openalex.org/C61423126","wikidata":"https://www.wikidata.org/wiki/Q187432","display_name":"Scripting language","level":2,"score":0.5783193111419678},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.48115694522857666},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4323316216468811},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4320456087589264},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.4125773012638092},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.3998304307460785},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.35384148359298706},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3291638493537903},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3130646347999573},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.1505376398563385},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.25080/majora-8b375195-004","is_oa":true,"landing_page_url":"https://doi.org/10.25080/majora-8b375195-004","pdf_url":"http://conference.scipy.org/proceedings/scipy2013/pdfs/bergstra_skdata.pdf","source":{"id":"https://openalex.org/S4220651651","display_name":"Proceedings of the Python in Science Conferences","issn_l":"2575-9752","issn":["2575-9752"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Python in Science Conference","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.25080/majora-8b375195-004","is_oa":true,"landing_page_url":"https://doi.org/10.25080/majora-8b375195-004","pdf_url":"http://conference.scipy.org/proceedings/scipy2013/pdfs/bergstra_skdata.pdf","source":{"id":"https://openalex.org/S4220651651","display_name":"Proceedings of the Python in Science Conferences","issn_l":"2575-9752","issn":["2575-9752"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Python in Science Conference","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.44999998807907104,"display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G756852635","display_name":"RI:  Medium:  Collaborative Research:  Unlocking Biologically-Inspired Computer Vision: A High-Throughput Approach","funder_award_id":"0963668","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G813443333","display_name":null,"funder_award_id":"IIS 0963668","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320332916","display_name":"Rowland Institute at Harvard","ror":"https://ror.org/03eta9142"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2475602767.pdf","grobid_xml":"https://content.openalex.org/works/W2475602767.grobid-xml"},"referenced_works_count":5,"referenced_works":["https://openalex.org/W1554944419","https://openalex.org/W1782590233","https://openalex.org/W2101234009","https://openalex.org/W2171033594","https://openalex.org/W3118608800"],"related_works":["https://openalex.org/W3023169329","https://openalex.org/W4389470870","https://openalex.org/W2782165897","https://openalex.org/W1582950852","https://openalex.org/W4300438041","https://openalex.org/W2054104202","https://openalex.org/W2139703748","https://openalex.org/W2761254753","https://openalex.org/W1024825291","https://openalex.org/W2188981919"],"abstract_inverted_index":{"Machine":[0],"learning":[1],"benchmark":[2,74],"data":[3,51,75,89],"sets":[4,76,90],"come":[5],"in":[6],"all":[7,35],"shapes":[8],"and":[9,26,32,78,87,101,113,128],"sizes,":[10],"whereas":[11],"classification":[12],"algorithms":[13],"assume":[14],"sanitized":[15],"input,":[16],"such":[17],"as":[18],"(x,":[19],"y)":[20],"pairs":[21],"with":[22,94,120],"vector-valued":[23],"input":[24],"x":[25],"integer":[27],"class":[28],"label":[29],"y.":[30],"Researchers":[31],"practitioners":[33],"know":[34],"too":[36],"well":[37],"how":[38],"tedious":[39],"it":[40],"can":[41,91],"be":[42,92],"to":[43,53],"get":[44],"from":[45],"the":[46,126,131],"URL":[47],"of":[48,73,111,130],"a":[49,54,70],"new":[50],"set":[52],"NumPy":[55],"ndarray":[56],"suitable":[57],"for":[58,69,85],"e.g.":[59],"pandas":[60],"or":[61],"sklearn.":[62],"The":[63,103],"SkData":[64,104,132],"library":[65,95,105],"handles":[66],"that":[67,81,97,116],"work":[68],"growing":[71],"number":[72],"(small":[77],"large)":[79],"so":[80],"one-off":[82],"in-house":[83],"scripts":[84],"downloading":[86],"parsing":[88],"replaced":[93],"code":[96],"is":[98],"reliable,":[99],"community-tested,":[100],"documented.":[102],"also":[106],"introduces":[107],"an":[108],"open-ended":[109],"formalization":[110],"training":[112],"testing":[114],"protocols":[115],"facilitates":[117],"direct":[118],"comparison":[119],"published":[121],"research.":[122],"This":[123],"paper":[124],"describes":[125],"usage":[127],"architecture":[129],"library.":[133]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":24},{"year":2024,"cited_by_count":19},{"year":2023,"cited_by_count":13},{"year":2022,"cited_by_count":17},{"year":2021,"cited_by_count":12},{"year":2020,"cited_by_count":4}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
