{"id":"https://openalex.org/W4283073619","doi":"https://doi.org/10.48550/arxiv.2206.07137","title":"Prioritized Training on Points that are Learnable, Worth Learning, and Not Yet Learnt","display_name":"Prioritized Training on Points that are Learnable, Worth Learning, and Not Yet Learnt","publication_year":2022,"publication_date":"2022-06-14","ids":{"openalex":"https://openalex.org/W4283073619","doi":"https://doi.org/10.48550/arxiv.2206.07137"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2206.07137","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2206.07137","pdf_url":"https://arxiv.org/pdf/2206.07137","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2206.07137","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5012960540","display_name":"S\u00f6ren Mindermann","orcid":"https://orcid.org/0000-0002-0315-9821"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Mindermann, S\u00f6ren","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030437398","display_name":"Jan Brauner","orcid":"https://orcid.org/0000-0002-1588-5724"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Brauner, Jan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021091772","display_name":"Muhammed Razzak","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Razzak, Muhammed","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003223014","display_name":"Mrinank Sharma","orcid":"https://orcid.org/0000-0002-4304-7963"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sharma, Mrinank","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091107812","display_name":"Andreas Kirsch","orcid":"https://orcid.org/0000-0003-3578-7504"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kirsch, Andreas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028046389","display_name":"Winnie Xu","orcid":"https://orcid.org/0000-0002-5810-0851"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Winnie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018259549","display_name":"Benedikt H\u00f6ltgen","orcid":"https://orcid.org/0009-0008-0882-9821"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"H\u00f6ltgen, Benedikt","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079288315","display_name":"Aidan N. Gomez","orcid":"https://orcid.org/0000-0001-5601-5437"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gomez, Aidan N.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029898181","display_name":"Adrien Morisot","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Morisot, Adrien","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051690066","display_name":"Sebastian Farquhar","orcid":"https://orcid.org/0000-0002-9185-6415"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Farquhar, Sebastian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5029186201","display_name":"Yarin Gal","orcid":"https://orcid.org/0000-0002-2733-2078"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gal, Yarin","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5012960540"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":19,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9789000153541565,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7492997646331787},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6143002510070801},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.5904628038406372},{"id":"https://openalex.org/keywords/hyperparameter","display_name":"Hyperparameter","score":0.5773203372955322},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5231068134307861},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4911458194255829},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.4875742793083191},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.44332388043403625},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4315151870250702},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.12657126784324646}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7492997646331787},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6143002510070801},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.5904628038406372},{"id":"https://openalex.org/C8642999","wikidata":"https://www.wikidata.org/wiki/Q4171168","display_name":"Hyperparameter","level":2,"score":0.5773203372955322},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5231068134307861},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4911458194255829},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.4875742793083191},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.44332388043403625},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4315151870250702},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.12657126784324646},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2206.07137","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2206.07137","pdf_url":"https://arxiv.org/pdf/2206.07137","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2206.07137","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2206.07137","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2206.07137","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2206.07137","pdf_url":"https://arxiv.org/pdf/2206.07137","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2140186469","https://openalex.org/W4390421286","https://openalex.org/W4280563792","https://openalex.org/W4389724018","https://openalex.org/W4318719684","https://openalex.org/W3183136280","https://openalex.org/W4318559728","https://openalex.org/W2775233965","https://openalex.org/W4360995913","https://openalex.org/W4312193868"],"abstract_inverted_index":{"Training":[0],"on":[1,14,103,135],"web-scale":[2],"data":[3,64,169],"can":[4],"take":[5],"months.":[6],"But":[7],"most":[8,49],"computation":[9],"and":[10,16,116,131,142,146,161],"time":[11],"is":[12],"wasted":[13],"redundant":[15],"noisy":[17,84],"points":[18,45,81,98,110],"that":[19,48,111],"are":[20,82,112],"already":[21],"learnt":[22],"or":[23,87],"not":[24,100,117],"learnable.":[25],"To":[26],"accelerate":[27],"training,":[28],"we":[29],"introduce":[30],"Reducible":[31],"Holdout":[32],"Loss":[33],"Selection":[34],"(RHO-LOSS),":[35],"a":[36,56,136],"simple":[37],"but":[38,79,96],"principled":[39],"technique":[40],"which":[41],"selects":[42,109],"approximately":[43],"those":[44],"for":[46],"training":[47,134],"reduce":[50],"the":[51,60,69,149],"model's":[52],"generalization":[53],"loss.":[54],"As":[55],"result,":[57],"RHO-LOSS":[58,108,120,155],"mitigates":[59],"weaknesses":[61],"of":[62,139],"existing":[63],"selection":[65],"methods:":[66],"techniques":[67],"from":[68],"optimization":[70],"literature":[71],"typically":[72],"select":[73],"'hard'":[74],"(e.g.":[75],"high":[76],"loss)":[77],"points,":[78,95],"such":[80,97],"often":[83],"(not":[85],"learnable)":[86],"less":[88],"task-relevant.":[89],"Conversely,":[90],"curriculum":[91],"learning":[92],"prioritizes":[93],"'easy'":[94],"need":[99],"be":[101],"trained":[102],"once":[104],"learned.":[105],"In":[106],"contrast,":[107],"learnable,":[113],"worth":[114],"learning,":[115],"yet":[118],"learnt.":[119],"trains":[121,156],"in":[122,157],"far":[123],"fewer":[124,159],"steps":[125,160],"than":[126,167],"prior":[127],"art,":[128],"improves":[129],"accuracy,":[130],"speeds":[132],"up":[133],"wide":[137],"range":[138],"datasets,":[140],"hyperparameters,":[141],"architectures":[143],"(MLPs,":[144],"CNNs,":[145],"BERT).":[147],"On":[148],"large":[150],"web-scraped":[151],"image":[152],"dataset":[153],"Clothing-1M,":[154],"18x":[158],"reaches":[162],"2%":[163],"higher":[164],"final":[165],"accuracy":[166],"uniform":[168],"shuffling.":[170]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":10},{"year":2022,"cited_by_count":2}],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2022-06-19T00:00:00"}
