{"id":"https://openalex.org/W4392402551","doi":"https://doi.org/10.5220/0012379800003660","title":"Scale Learning in Scale-Equivariant Convolutional Networks","display_name":"Scale Learning in Scale-Equivariant Convolutional Networks","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4392402551","doi":"https://doi.org/10.5220/0012379800003660"},"language":"en","primary_location":{"id":"doi:10.5220/0012379800003660","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0012379800003660","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 19th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.5220/0012379800003660","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5094056125","display_name":"Mark Basting","orcid":null},"institutions":[{"id":"https://openalex.org/I98358874","display_name":"Delft University of Technology","ror":"https://ror.org/02e2c7k09","country_code":"NL","type":"education","lineage":["https://openalex.org/I98358874"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Mark Basting","raw_affiliation_strings":["Computer Vision Lab, Delft University of Technology, The Netherlands, --- Select a Country ---"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computer Vision Lab, Delft University of Technology, The Netherlands, --- Select a Country ---","institution_ids":["https://openalex.org/I98358874"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052695749","display_name":"Robert-Jan Bruintjes","orcid":"https://orcid.org/0000-0002-9798-0214"},"institutions":[{"id":"https://openalex.org/I98358874","display_name":"Delft University of Technology","ror":"https://ror.org/02e2c7k09","country_code":"NL","type":"education","lineage":["https://openalex.org/I98358874"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Robert-Jan Bruintjes","raw_affiliation_strings":["Computer Vision Lab, Delft University of Technology, The Netherlands, --- Select a Country ---"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computer Vision Lab, Delft University of Technology, The Netherlands, --- Select a Country ---","institution_ids":["https://openalex.org/I98358874"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054652375","display_name":"Thadd\u00e4us Wiedemer","orcid":"https://orcid.org/0009-0003-6280-0804"},"institutions":[{"id":"https://openalex.org/I8087733","display_name":"University of T\u00fcbingen","ror":"https://ror.org/03a1kwz48","country_code":"DE","type":"education","lineage":["https://openalex.org/I8087733"]},{"id":"https://openalex.org/I4210135521","display_name":"Max Planck Institute for Intelligent Systems","ror":"https://ror.org/04fq9j139","country_code":"DE","type":"facility","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210135521"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Thadd\u00e4us Wiedemer","raw_affiliation_strings":["Bethgelab, University of T\u00fcbingen, Geschwister-Scholl-Platz, T\u00fcbingen, Germany, --- Select a Country ---","Machine Learning, Max-Planck-Institute for Intelligent Systems, Max-Planck-Ring, T\u00fcbingen, Germany, --- Select a Country ---"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Bethgelab, University of T\u00fcbingen, Geschwister-Scholl-Platz, T\u00fcbingen, Germany, --- Select a Country ---","institution_ids":["https://openalex.org/I8087733"]},{"raw_affiliation_string":"Machine Learning, Max-Planck-Institute for Intelligent Systems, Max-Planck-Ring, T\u00fcbingen, Germany, --- Select a Country ---","institution_ids":["https://openalex.org/I4210135521"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068221391","display_name":"Matthias K\u00fcmmerer","orcid":"https://orcid.org/0000-0001-9644-4703"},"institutions":[{"id":"https://openalex.org/I8087733","display_name":"University of T\u00fcbingen","ror":"https://ror.org/03a1kwz48","country_code":"DE","type":"education","lineage":["https://openalex.org/I8087733"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Matthias K\u00fcmmerer","raw_affiliation_strings":["Bethgelab, University of T\u00fcbingen, Geschwister-Scholl-Platz, T\u00fcbingen, Germany, --- Select a Country ---"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Bethgelab, University of T\u00fcbingen, Geschwister-Scholl-Platz, T\u00fcbingen, Germany, --- Select a Country ---","institution_ids":["https://openalex.org/I8087733"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061457780","display_name":"Matthias Bethge","orcid":"https://orcid.org/0000-0002-6417-7812"},"institutions":[{"id":"https://openalex.org/I8087733","display_name":"University of T\u00fcbingen","ror":"https://ror.org/03a1kwz48","country_code":"DE","type":"education","lineage":["https://openalex.org/I8087733"]},{"id":"https://openalex.org/I4401726832","display_name":"T\u00fcbingen AI Center","ror":"https://ror.org/0107nyd78","country_code":null,"type":"education","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210135521","https://openalex.org/I4401726832","https://openalex.org/I8087733"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Matthias Bethge","raw_affiliation_strings":["Bethgelab, University of T\u00fcbingen, Geschwister-Scholl-Platz, T\u00fcbingen, Germany, --- Select a Country ---","T\u00fcbingen AI Center, Maria-von-Linden-Stra\u00dfe, T\u00fcbingen, Germany, --- Select a Country ---"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Bethgelab, University of T\u00fcbingen, Geschwister-Scholl-Platz, T\u00fcbingen, Germany, --- Select a Country ---","institution_ids":["https://openalex.org/I8087733"]},{"raw_affiliation_string":"T\u00fcbingen AI Center, Maria-von-Linden-Stra\u00dfe, T\u00fcbingen, Germany, --- Select a Country ---","institution_ids":["https://openalex.org/I4401726832"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077258803","display_name":"Jan van Gemert","orcid":"https://orcid.org/0000-0002-3913-2786"},"institutions":[{"id":"https://openalex.org/I98358874","display_name":"Delft University of Technology","ror":"https://ror.org/02e2c7k09","country_code":"NL","type":"education","lineage":["https://openalex.org/I98358874"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Jan van Gemert","raw_affiliation_strings":["Computer Vision Lab, Delft University of Technology, The Netherlands, --- Select a Country ---"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computer Vision Lab, Delft University of Technology, The Netherlands, --- Select a Country ---","institution_ids":["https://openalex.org/I98358874"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5094056125"],"corresponding_institution_ids":["https://openalex.org/I98358874"],"apc_list":null,"apc_paid":null,"fwci":0.9379,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.7749593,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"567","last_page":"574"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9366999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9366999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.7402061223983765},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6651487350463867},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4085954427719116},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.1291283667087555},{"id":"https://openalex.org/keywords/cartography","display_name":"Cartography","score":0.08342880010604858}],"concepts":[{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.7402061223983765},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6651487350463867},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4085954427719116},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.1291283667087555},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.08342880010604858}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.5220/0012379800003660","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0012379800003660","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 19th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications","raw_type":"proceedings-article"},{"id":"pmh:oai:tudelft.nl:uuid:72821daa-2034-4ac8-aabb-b03e0c4404c3","is_oa":false,"landing_page_url":"http://resolver.tudelft.nl/uuid:72821daa-2034-4ac8-aabb-b03e0c4404c3","pdf_url":null,"source":{"id":"https://openalex.org/S4306400906","display_name":"Research Repository (Delft University of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98358874","host_organization_name":"Delft University of Technology","host_organization_lineage":["https://openalex.org/I98358874"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"master thesis"}],"best_oa_location":{"id":"doi:10.5220/0012379800003660","is_oa":true,"landing_page_url":"https://doi.org/10.5220/0012379800003660","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 19th International Joint Conference on Computer Vision, Imaging and Computer Graphics Theory and Applications","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W2478288626","https://openalex.org/W4391913857","https://openalex.org/W2350741829","https://openalex.org/W2530322880"],"abstract_inverted_index":{"In":[0,120],"real-life":[1],"scenarios,":[2],"there":[3],"are":[4,18,45,135],"many":[5],"variations":[6],"in":[7,31,40,115,163],"sizes":[8],"of":[9,11,38,61,77,87,110,127,159,247],"objects":[10,17,32],"the":[12,16,27,41,62,90,103,107,116,129,150,166,181,195,198,204,210,214,224,231,234,241,245,248,250,262,274,296],"same":[13,63],"category":[14],"and":[15,51,223,236,270,287],"not":[19,170,179],"always":[20],"placed":[21],"at":[22,131],"a":[23,75,125,185],"fixed":[24,79,186],"distance":[25],"from":[26],"camera.":[28],"This":[29],"results":[30],"taking":[33],"up":[34],"an":[35],"arbitrary":[36],"size":[37],"pixels":[39],"image.":[42],"Vanilla":[43],"CNNs":[44],"by":[46,213],"design":[47],"only":[48],"translation":[49],"equivariant":[50,253],"thus":[52],"have":[53,68],"to":[54,84,100,149,173,194,220,290],"learn":[55,244,261],"separate":[56],"filters":[57],"for":[58,137,154,200],"scaled":[59],"variants":[60],"objects.":[64,141],"Recently,":[65],"scale-equivariant":[66,175,293],"approaches":[67,294],"been":[69],"developed":[70],"that":[71,229,257],"share":[72],"features":[73,130],"across":[74],"set":[76,86,187],"pre-determined":[78],"scales.":[80,92],"We":[81,208,255],"further":[82],"refer":[83,219],"this":[85,121],"scales":[88,105,134,148,153,183,212,249,264,276],"as":[89,184,221],"internal":[91,104,133,147,152,182,211,263,275],"Existing":[93],"work":[94],"gives":[95],"little":[96],"information":[97],"about":[98,203],"how":[99,128],"best":[101],"choose":[102],"when":[106],"underlying":[108],"distribution":[109,158,168],"sizes,":[111],"or":[112],"scale":[113,157,167,206,216,268,284],"distribution,":[114],"dataset,":[117],"is":[118,169,252],"known.":[119,171],"work,":[122],"we":[123,177,218,243,281],"develop":[124],"model":[126,144,251],"different":[132,155],"used":[136],"samples":[138],"containing":[139],"differently-sized":[140],"The":[142],"proposed":[143],"return":[145],"comparable":[146],"best-performing":[151],"data":[156,205,267],"various":[160,266],"width.":[161],"However,":[162],"most":[164],"cases,":[165],"Compared":[172],"previous":[174],"methods,":[176],"do":[178],"treat":[180],"but":[188],"directly":[189],"optimise":[190],"them":[191],"with":[192],"regard":[193],"loss,":[196],"removing":[197],"need":[199],"prior":[201],"knowledge":[202],"distribution.":[207],"parameterise":[209],"smallest":[215,235],"which":[217],"\u03c3basis,":[222],"Internal":[225],"Scale":[226],"Range":[227],"(ISR)":[228],"models":[230],"ratio":[232],"between":[233],"largest":[237],"scale.":[238],"By":[239],"varying":[240],"ISR,":[242],"range":[246],"to.":[254],"show":[256],"our":[258,283],"method":[259],"can":[260,271],"on":[265,295],"distributions":[269],"better":[272],"adapt":[273],"than":[277],"other":[278,288],"parameterisations.":[279],"Finally,":[280],"compare":[282],"learning":[285],"approach":[286],"parameterisations":[289],"current":[291],"State-of-the-art":[292],"MNIST-Scale":[297],"dataset.":[298]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2}],"updated_date":"2026-05-28T09:10:13.091523","created_date":"2025-10-10T00:00:00"}
