{"id":"https://openalex.org/W4416429642","doi":"https://doi.org/10.1109/iccad66269.2025.11240877","title":"QuickFlow: An Efficient Local Search Method to Map Convolutions on Spatial Architectures","display_name":"QuickFlow: An Efficient Local Search Method to Map Convolutions on Spatial Architectures","publication_year":2025,"publication_date":"2025-10-26","ids":{"openalex":"https://openalex.org/W4416429642","doi":"https://doi.org/10.1109/iccad66269.2025.11240877"},"language":"en","primary_location":{"id":"doi:10.1109/iccad66269.2025.11240877","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccad66269.2025.11240877","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/ACM International Conference On Computer Aided Design (ICCAD)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://re.public.polimi.it/bitstream/11311/1308828/1/QuickFlow_An_Efficient_Local_Search_Method_to_Map_Convolutions_on_Spatial_Architectures.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5116500165","display_name":"Marco Ronzani","orcid":null},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Marco Ronzani","raw_affiliation_strings":["DEIB, Politecnico di Milano,Italy"],"affiliations":[{"raw_affiliation_string":"DEIB, Politecnico di Milano,Italy","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031461662","display_name":"Cristina Silvano","orcid":"https://orcid.org/0000-0003-1668-0883"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Cristina Silvano","raw_affiliation_strings":["DEIB, Politecnico di Milano,Italy"],"affiliations":[{"raw_affiliation_string":"DEIB, Politecnico di Milano,Italy","institution_ids":["https://openalex.org/I93860229"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5116500165"],"corresponding_institution_ids":["https://openalex.org/I93860229"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.37326002,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"9"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.7918999791145325,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.7918999791145325,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.07440000027418137,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.01590000092983246,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dataflow","display_name":"Dataflow","score":0.6919999718666077},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.4896000027656555},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.45829999446868896},{"id":"https://openalex.org/keywords/memory-hierarchy","display_name":"Memory hierarchy","score":0.4562000036239624},{"id":"https://openalex.org/keywords/reuse","display_name":"Reuse","score":0.43529999256134033},{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.4311000108718872},{"id":"https://openalex.org/keywords/data-mapping","display_name":"Data mapping","score":0.4187000095844269},{"id":"https://openalex.org/keywords/data-structure","display_name":"Data structure","score":0.3781000077724457}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8363999724388123},{"id":"https://openalex.org/C96324660","wikidata":"https://www.wikidata.org/wiki/Q205446","display_name":"Dataflow","level":2,"score":0.6919999718666077},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.4896000027656555},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4691999852657318},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.45829999446868896},{"id":"https://openalex.org/C2778100165","wikidata":"https://www.wikidata.org/wiki/Q1589327","display_name":"Memory hierarchy","level":3,"score":0.4562000036239624},{"id":"https://openalex.org/C206588197","wikidata":"https://www.wikidata.org/wiki/Q846574","display_name":"Reuse","level":2,"score":0.43529999256134033},{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.4311000108718872},{"id":"https://openalex.org/C137314826","wikidata":"https://www.wikidata.org/wiki/Q2330408","display_name":"Data mapping","level":2,"score":0.4187000095844269},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.3781000077724457},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3643999993801117},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.32690000534057617},{"id":"https://openalex.org/C90673727","wikidata":"https://www.wikidata.org/wiki/Q901718","display_name":"Product (mathematics)","level":2,"score":0.32580000162124634},{"id":"https://openalex.org/C2776221188","wikidata":"https://www.wikidata.org/wiki/Q21072556","display_name":"Design space exploration","level":2,"score":0.31369999051094055},{"id":"https://openalex.org/C31170391","wikidata":"https://www.wikidata.org/wiki/Q188619","display_name":"Hierarchy","level":2,"score":0.3086000084877014},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.3003000020980835},{"id":"https://openalex.org/C159620131","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Spatial analysis","level":2,"score":0.28999999165534973},{"id":"https://openalex.org/C184596265","wikidata":"https://www.wikidata.org/wiki/Q2651576","display_name":"Model of computation","level":3,"score":0.288100004196167},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.28040000796318054},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.2718999981880188},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.25850000977516174},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.2574999928474426},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.2556999921798706},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.25099998712539673}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/iccad66269.2025.11240877","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccad66269.2025.11240877","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/ACM International Conference On Computer Aided Design (ICCAD)","raw_type":"proceedings-article"},{"id":"pmh:oai:re.public.polimi.it:11311/1308828","is_oa":true,"landing_page_url":"https://hdl.handle.net/11311/1308828","pdf_url":"https://re.public.polimi.it/bitstream/11311/1308828/1/QuickFlow_An_Efficient_Local_Search_Method_to_Map_Convolutions_on_Spatial_Architectures.pdf","source":{"id":"https://openalex.org/S4306400312","display_name":"Virtual Community of Pathological Anatomy (University of Castilla La Mancha)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79189158","host_organization_name":"University of Castilla-La Mancha","host_organization_lineage":["https://openalex.org/I79189158"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":{"id":"pmh:oai:re.public.polimi.it:11311/1308828","is_oa":true,"landing_page_url":"https://hdl.handle.net/11311/1308828","pdf_url":"https://re.public.polimi.it/bitstream/11311/1308828/1/QuickFlow_An_Efficient_Local_Search_Method_to_Map_Convolutions_on_Spatial_Architectures.pdf","source":{"id":"https://openalex.org/S4306400312","display_name":"Virtual Community of Pathological Anatomy (University of Castilla La Mancha)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79189158","host_organization_name":"University of Castilla-La Mancha","host_organization_lineage":["https://openalex.org/I79189158"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4416429642.pdf","grobid_xml":"https://content.openalex.org/works/W4416429642.grobid-xml"},"referenced_works_count":26,"referenced_works":["https://openalex.org/W2268122618","https://openalex.org/W2332901121","https://openalex.org/W2395611524","https://openalex.org/W2906043559","https://openalex.org/W2940862705","https://openalex.org/W2949967139","https://openalex.org/W2953212265","https://openalex.org/W2980104813","https://openalex.org/W2980200167","https://openalex.org/W2982083293","https://openalex.org/W2997929983","https://openalex.org/W2998732502","https://openalex.org/W3101026687","https://openalex.org/W3132942233","https://openalex.org/W3173351640","https://openalex.org/W3174280965","https://openalex.org/W3190062760","https://openalex.org/W3192336523","https://openalex.org/W3217256060","https://openalex.org/W4286300805","https://openalex.org/W4360831984","https://openalex.org/W4383501739","https://openalex.org/W4389491911","https://openalex.org/W4407319928","https://openalex.org/W4408151313","https://openalex.org/W4409568286"],"related_works":[],"abstract_inverted_index":{"Efficiently":[0],"running":[1],"deep":[2],"neural":[3],"networks":[4],"requires":[5],"the":[6,56,77,169,242],"hardware":[7,67,125],"acceleration":[8],"of":[9,58,161],"convolutional":[10],"kernels.":[11,148],"Spatial":[12],"Architectures":[13],"(SAs)":[14],"are":[15],"a":[16,24,38,135,158,189,210,228],"natural":[17],"fit,":[18],"employing":[19],"multiple":[20],"processing":[21],"elements":[22],"and":[23,31,44,61,124,146,175,223,233],"custom":[25],"memory":[26],"hierarchy":[27],"to":[28,40,54,105,116,185,194,235,241],"exploit":[29],"parallelism":[30,176],"data":[32,42,163],"reuse.":[33],"In":[34,149],"turn,":[35],"SAs":[36,145,222],"require":[37],"mapping":[39,49,78,91,137,248],"specify":[41],"movements":[43],"computation":[45],"order.":[46],"Thus,":[47],"specialized":[48],"tools":[50],"have":[51],"been":[52],"developed":[53],"explore":[55],"space":[57,79,127],"possible":[59],"mappings":[60,111,143,155],"retrieve":[62],"optimal":[63],"ones,":[64],"using":[65],"analytical":[66,204],"models":[68],"for":[69,73,100,144,214],"performance":[70,84],"feedback.":[71],"However,":[72],"each":[74],"SA-kernel":[75],"pair,":[76],"is":[80],"vast,":[81],"with":[82],"significant":[83],"variations":[85],"arising":[86],"from":[87,245],"subtle":[88],"interactions":[89],"between":[90,154],"decisions.":[92],"Therefore,":[93],"coordinating":[94],"all":[95],"problem":[96],"aspects":[97],"remains":[98],"challenging":[99],"existing":[101],"tools,":[102],"often":[103],"leading":[104],"long":[106],"execution":[107,238],"times.":[108],"Yet,":[109],"high-quality":[110],"must":[112],"be":[113],"promptly":[114],"available":[115],"support":[117],"downstream":[118],"tasks,":[119],"like":[120],"runtime":[121],"resource":[122],"allocation":[123],"design":[126],"exploration.":[128],"To":[129],"address":[130],"this,":[131],"we":[132,151,167],"propose":[133],"QuickFlow,":[134,150],"new":[136],"tool":[138],"that":[139],"efficiently":[140],"finds":[141],"near-optimal":[142,197],"AI":[147],"build":[152],"equivalences":[153],"based":[156],"on":[157,220],"detailed":[159],"analysis":[160],"distinct":[162],"reuse":[164],"opportunities.":[165],"Then,":[166],"redesign":[168],"optimization":[170],"paradigm":[171],"accordingly,":[172],"comparing":[173],"tiling":[174],"decisions":[177],"after":[178],"quickly":[179],"selecting":[180],"their":[181],"best":[182,243],"dataflow":[183],"up":[184,234],"equivalence,":[186],"ultimately":[187],"enabling":[188],"single":[190],"greedy":[191],"local":[192],"search":[193],"effectively":[195],"reach":[196],"mappings.":[198],"QuickFlow":[199,226],"also":[200],"integrates":[201],"an":[202],"improved":[203],"model,":[205],"supporting":[206],"arbitrary":[207],"convolutions":[208],"through":[209],"novel,":[211],"exact":[212],"formula":[213],"tile":[215],"sizes.":[216],"Across":[217],"our":[218],"experiments":[219],"three":[221],"twenty":[224],"kernels,":[225],"achieves":[227],"1\u20132.1\u00d7":[229],"better":[230],"energy-delay":[231],"product":[232],"182\u00d7":[236],"faster":[237],"time":[239],"compared":[240],"results":[244],"four":[246],"state-of-the-art":[247],"tools.":[249]},"counts_by_year":[],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-11-20T00:00:00"}
