{"id":"https://openalex.org/W4306317054","doi":"https://doi.org/10.1145/3511808.3557366","title":"Intersection of Parallels as an Early Stopping Criterion","display_name":"Intersection of Parallels as an Early Stopping Criterion","publication_year":2022,"publication_date":"2022-10-16","ids":{"openalex":"https://openalex.org/W4306317054","doi":"https://doi.org/10.1145/3511808.3557366"},"language":"en","primary_location":{"id":"doi:10.1145/3511808.3557366","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3511808.3557366","pdf_url":null,"source":{"id":"https://openalex.org/S4363608762","display_name":"Proceedings of the 31st ACM International Conference on Information &amp; Knowledge Management","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Information &amp; Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072883623","display_name":"Ali Vardasbi","orcid":"https://orcid.org/0000-0002-9342-5272"},"institutions":[{"id":"https://openalex.org/I887064364","display_name":"University of Amsterdam","ror":"https://ror.org/04dkp9463","country_code":"NL","type":"education","lineage":["https://openalex.org/I887064364"]},{"id":"https://openalex.org/I4210135670","display_name":"Amsterdam University of the Arts","ror":"https://ror.org/04dde1554","country_code":"NL","type":"education","lineage":["https://openalex.org/I4210135670"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Ali Vardasbi","raw_affiliation_strings":["University of Amsterdam, Amsterdam, Netherlands"],"affiliations":[{"raw_affiliation_string":"University of Amsterdam, Amsterdam, Netherlands","institution_ids":["https://openalex.org/I4210135670","https://openalex.org/I887064364"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031439294","display_name":"Maarten de Rijke","orcid":"https://orcid.org/0000-0002-1086-0202"},"institutions":[{"id":"https://openalex.org/I887064364","display_name":"University of Amsterdam","ror":"https://ror.org/04dkp9463","country_code":"NL","type":"education","lineage":["https://openalex.org/I887064364"]},{"id":"https://openalex.org/I4210135670","display_name":"Amsterdam University of the Arts","ror":"https://ror.org/04dde1554","country_code":"NL","type":"education","lineage":["https://openalex.org/I4210135670"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Maarten de Rijke","raw_affiliation_strings":["University of Amsterdam, Amsterdam, Netherlands"],"affiliations":[{"raw_affiliation_string":"University of Amsterdam, Amsterdam, Netherlands","institution_ids":["https://openalex.org/I4210135670","https://openalex.org/I887064364"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102906366","display_name":"Mostafa Dehghani","orcid":"https://orcid.org/0000-0002-9772-1095"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mostafa Dehghani","raw_affiliation_strings":["Google Brain, Amsterdam, Netherlands"],"affiliations":[{"raw_affiliation_string":"Google Brain, Amsterdam, Netherlands","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5072883623"],"corresponding_institution_ids":["https://openalex.org/I4210135670","https://openalex.org/I887064364"],"apc_list":null,"apc_paid":null,"fwci":0.2096,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.42802629,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1965","last_page":"1974"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.9034516215324402},{"id":"https://openalex.org/keywords/early-stopping","display_name":"Early stopping","score":0.8758722543716431},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6569426655769348},{"id":"https://openalex.org/keywords/disjoint-sets","display_name":"Disjoint sets","score":0.6235615611076355},{"id":"https://openalex.org/keywords/intersection","display_name":"Intersection (aeronautics)","score":0.5991136431694031},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5561032295227051},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.5220046639442444},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.46656978130340576},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4259186089038849},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.39055711030960083},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3426729440689087},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2772965431213379},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.2623744308948517}],"concepts":[{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.9034516215324402},{"id":"https://openalex.org/C5465570","wikidata":"https://www.wikidata.org/wiki/Q5326898","display_name":"Early stopping","level":3,"score":0.8758722543716431},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6569426655769348},{"id":"https://openalex.org/C45340560","wikidata":"https://www.wikidata.org/wiki/Q215382","display_name":"Disjoint sets","level":2,"score":0.6235615611076355},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.5991136431694031},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5561032295227051},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.5220046639442444},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.46656978130340576},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4259186089038849},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.39055711030960083},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3426729440689087},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2772965431213379},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.2623744308948517},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3511808.3557366","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3511808.3557366","pdf_url":null,"source":{"id":"https://openalex.org/S4363608762","display_name":"Proceedings of the 31st ACM International Conference on Information &amp; Knowledge Management","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Information &amp; Knowledge Management","raw_type":"proceedings-article"},{"id":"pmh:oai:dare.uva.nl:openaire_cris_publications/10d627b7-78ce-4b52-af75-7e8d9a8dae90","is_oa":false,"landing_page_url":"https://handle.uba.uva.nl/personal/pure/en/publications/intersection-of-parallels-as-an-early-stopping-criterion(10d627b7-78ce-4b52-af75-7e8d9a8dae90).html","pdf_url":null,"source":{"id":"https://openalex.org/S4306400088","display_name":"UvA-DARE (University of Amsterdam)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I887064364","host_organization_name":"University of Amsterdam","host_organization_lineage":["https://openalex.org/I887064364"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Vardasbi, A, de Rijke, M & Dehghani, M 2022, Intersection of Parallels as an Early Stopping Criterion. in CIKM '22 : proceedings of the 31st ACM International Conference on Information & Knowledge Management : October 17-21, 2022, Atlanta, GA, USA. New York, NY, pp. 1965-1974, 31st ACM International Conference on Information and Knowledge Management, CIKM 2022, Atlanta, United States, 17/10/22. https://doi.org/10.1145/3511808.3557366","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:dare.uva.nl:publications/10d627b7-78ce-4b52-af75-7e8d9a8dae90","is_oa":false,"landing_page_url":"https://hdl.handle.net/11245.1/10d627b7-78ce-4b52-af75-7e8d9a8dae90","pdf_url":null,"source":{"id":"https://openalex.org/S4306400088","display_name":"UvA-DARE (University of Amsterdam)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I887064364","host_organization_name":"University of Amsterdam","host_organization_lineage":["https://openalex.org/I887064364"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Vardasbi, A, de Rijke, M & Dehghani, M 2022, Intersection of Parallels as an Early Stopping Criterion. in CIKM '22 : proceedings of the 31st ACM International Conference on Information & Knowledge Management : October 17-21, 2022, Atlanta, GA, USA. New York, NY, pp. 1965-1974, 31st ACM International Conference on Information and Knowledge Management, CIKM 2022, Atlanta, United States, 17/10/22. https://doi.org/10.1145/3511808.3557366","raw_type":"info:eu-repo/semantics/publishedVersion"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W1576278180","https://openalex.org/W2014051179","https://openalex.org/W2034978228","https://openalex.org/W2065468017","https://openalex.org/W2071613752","https://openalex.org/W2108862644","https://openalex.org/W2507134384","https://openalex.org/W2784672094","https://openalex.org/W2911742574","https://openalex.org/W2963417959","https://openalex.org/W2963518130","https://openalex.org/W3025991882","https://openalex.org/W3200016735","https://openalex.org/W4230960434","https://openalex.org/W4287777768","https://openalex.org/W4288079518","https://openalex.org/W4288280739","https://openalex.org/W6747597888"],"related_works":["https://openalex.org/W4254751698","https://openalex.org/W2922073769","https://openalex.org/W4320854463","https://openalex.org/W3040157805","https://openalex.org/W4288022214","https://openalex.org/W4387799548","https://openalex.org/W4385768004","https://openalex.org/W3008105014","https://openalex.org/W1724442104","https://openalex.org/W2156876426"],"abstract_inverted_index":{"A":[0],"common":[1],"way":[2],"to":[3,23,104,142,153,174,179,213,228,264,298],"avoid":[4],"overfitting":[5,252],"in":[6,28,110,129,266,311],"supervised":[7],"learning":[8,257,263,289],"is":[9,16,57,65,71,205],"early":[10,107,245],"stopping,":[11],"where":[12],"a":[13,25,40,43,86,102,122,138,159,172,203,206,254,285],"held-out":[14],"set":[15,56,88],"used":[17,274],"for":[18,61,95,121,221,282],"iterative":[19],"evaluation":[20],"during":[21,146,194],"training":[22,32,55,69,76,112,195],"find":[24],"sweet":[26],"spot":[27,105],"the":[29,50,54,75,80,83,111,119,130,133,143,184,188,191,199,232,277,305,315],"number":[30],"of":[31,49,82,114,137,158,190,202,209,235,253,279,288,314],"steps":[33],"that":[34,128,198,244,307],"gives":[35],"maximum":[36],"generalization.":[37,96,283],"However,":[38],"such":[39],"method":[41,103,281],"requires":[42],"disjoint":[44],"validation":[45,87,123],"set,":[46],"thus":[47],"part":[48],"labeled":[51],"data":[52,70],"from":[53,258],"usually":[58],"left":[59],"out":[60],"this":[62,98,149],"purpose,":[63],"which":[64],"not":[66,90],"ideal":[67],"when":[68,74],"scarce.":[72],"Furthermore,":[73],"labels":[77],"are":[78],"noisy,":[79],"performance":[81],"model":[84,140],"over":[85],"may":[89],"be":[91],"an":[92,106,115,226],"accurate":[93],"proxy":[94],"In":[97,177],"paper,":[99],"we":[100,151,182,216,308],"propose":[101,152,225],"stopping":[108,246],"point":[109],"iterations":[113],"overparameterized":[116,131],"(NN)":[117],"without":[118],"need":[120],"set.":[124],"We":[125,238],"first":[126],"show":[127],"regime":[132],"randomly":[134],"initialized":[135,162],"weights":[136,189],"linear":[139,160,207,222],"converge":[141],"same":[144],"direction":[145],"training.":[147],"Using":[148],"result,":[150],"train":[154],"two":[155,242],"parallel":[156,192],"instances":[157],"model,":[161],"with":[163],"different":[164],"random":[165],"seeds,":[166],"and":[167,224,261],"use":[168,183],"their":[169],"intersection":[170],"as":[171],"signal":[173],"detect":[175,180],"overfitting.":[176],"order":[178],"intersection,":[181],"cosine":[185],"distance":[186],"between":[187],"models":[193,223],"iterations.":[196],"Noticing":[197],"final":[200],"layer":[201,211],"NN":[204],"map":[208],"pre-last":[210],"activations":[212],"output":[214],"logits,":[215],"build":[217],"on":[218,241,250,271,301],"our":[219,280,291],"criterion":[220],"extension":[227],"multi-layer":[229],"networks,":[230],"using":[231],"new":[233],"notion":[234],"counterfactual":[236],"weights.":[237],"conduct":[239],"experiments":[240,270],"areas":[243],"has":[247],"noticeable":[248],"impact":[249],"preventing":[251],"NN:":[255],"(i)":[256],"noisy":[259],"labels;":[260],"(ii)":[262],"rank":[265],"information":[267],"retrieval.":[268],"Our":[269],"four":[272],"widely":[273],"datasets":[275],"confirm":[276],"effectiveness":[278],"For":[284],"wide":[286],"range":[287],"rates,":[290],"method,":[292],"called":[293],"Cosine-Distance":[294],"Criterion":[295],"(CDC),":[296],"leads":[297],"better":[299],"generalization":[300],"average":[302],"than":[303],"all":[304,313],"methods":[306],"compare":[309],"against":[310],"almost":[312],"tested":[316],"cases.":[317]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-03-17T09:09:15.849793","created_date":"2025-10-10T00:00:00"}
