{"id":"https://openalex.org/W7140789122","doi":"https://doi.org/10.1109/fpl68686.2025.00053","title":"Accelerating K-Means: A Vectorized Approach for AI Engines &amp; Neural Processing Units","display_name":"Accelerating K-Means: A Vectorized Approach for AI Engines &amp; Neural Processing Units","publication_year":2025,"publication_date":"2025-09-01","ids":{"openalex":"https://openalex.org/W7140789122","doi":"https://doi.org/10.1109/fpl68686.2025.00053"},"language":"en","primary_location":{"id":"doi:10.1109/fpl68686.2025.00053","is_oa":false,"landing_page_url":"https://doi.org/10.1109/fpl68686.2025.00053","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 35th International Conference on Field-Programmable Logic and Applications (FPL)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://hdl.handle.net/11311/1311651","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5119281754","display_name":"Eleonora Cabai","orcid":null},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Eleonora Cabai","raw_affiliation_strings":["Dipartimento di Elettronica, Informazione e Bioingegneria (DEIB), Politecnico di Milano"],"affiliations":[{"raw_affiliation_string":"Dipartimento di Elettronica, Informazione e Bioingegneria (DEIB), Politecnico di Milano","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103099232","display_name":"Giuseppe Sorrentino","orcid":"https://orcid.org/0009-0009-3025-8620"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Giuseppe Sorrentino","raw_affiliation_strings":["Dipartimento di Elettronica, Informazione e Bioingegneria (DEIB), Politecnico di Milano"],"affiliations":[{"raw_affiliation_string":"Dipartimento di Elettronica, Informazione e Bioingegneria (DEIB), Politecnico di Milano","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010543929","display_name":"Marco D. Santambrogio","orcid":"https://orcid.org/0000-0002-9883-9693"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Marco Domenico Santambrogio","raw_affiliation_strings":["Dipartimento di Elettronica, Informazione e Bioingegneria (DEIB), Politecnico di Milano"],"affiliations":[{"raw_affiliation_string":"Dipartimento di Elettronica, Informazione e Bioingegneria (DEIB), Politecnico di Milano","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031247318","display_name":"Davide Conficconi","orcid":"https://orcid.org/0000-0002-5834-0812"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Davide Conficconi","raw_affiliation_strings":["Dipartimento di Elettronica, Informazione e Bioingegneria (DEIB), Politecnico di Milano"],"affiliations":[{"raw_affiliation_string":"Dipartimento di Elettronica, Informazione e Bioingegneria (DEIB), Politecnico di Milano","institution_ids":["https://openalex.org/I93860229"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5119281754"],"corresponding_institution_ids":["https://openalex.org/I93860229"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.74570642,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"337","last_page":"341"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.13619999587535858,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.13619999587535858,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.06729999929666519,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.0502999983727932,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.48100000619888306},{"id":"https://openalex.org/keywords/data-processing","display_name":"Data processing","score":0.31850001215934753},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.3043000102043152},{"id":"https://openalex.org/keywords/signal-processing","display_name":"Signal processing","score":0.2919999957084656},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.24779999256134033}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6128000020980835},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.48100000619888306},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4758000075817108},{"id":"https://openalex.org/C138827492","wikidata":"https://www.wikidata.org/wiki/Q6661985","display_name":"Data processing","level":2,"score":0.31850001215934753},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3043000102043152},{"id":"https://openalex.org/C104267543","wikidata":"https://www.wikidata.org/wiki/Q208163","display_name":"Signal processing","level":3,"score":0.2919999957084656},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2838999927043915},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.24779999256134033},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.24230000376701355},{"id":"https://openalex.org/C199639397","wikidata":"https://www.wikidata.org/wiki/Q1788588","display_name":"Engineering drawing","level":1,"score":0.2410999983549118}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/fpl68686.2025.00053","is_oa":false,"landing_page_url":"https://doi.org/10.1109/fpl68686.2025.00053","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 35th International Conference on Field-Programmable Logic and Applications (FPL)","raw_type":"proceedings-article"},{"id":"pmh:oai:re.public.polimi.it:11311/1311651","is_oa":true,"landing_page_url":"https://hdl.handle.net/11311/1311651","pdf_url":null,"source":{"id":"https://openalex.org/S4306400312","display_name":"Virtual Community of Pathological Anatomy (University of Castilla La Mancha)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79189158","host_organization_name":"University of Castilla-La Mancha","host_organization_lineage":["https://openalex.org/I79189158"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":{"id":"pmh:oai:re.public.polimi.it:11311/1311651","is_oa":true,"landing_page_url":"https://hdl.handle.net/11311/1311651","pdf_url":null,"source":{"id":"https://openalex.org/S4306400312","display_name":"Virtual Community of Pathological Anatomy (University of Castilla La Mancha)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79189158","host_organization_name":"University of Castilla-La Mancha","host_organization_lineage":["https://openalex.org/I79189158"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W1977556410","https://openalex.org/W1983524036","https://openalex.org/W1997217298","https://openalex.org/W2019397928","https://openalex.org/W2122522028","https://openalex.org/W2135364554","https://openalex.org/W2150593711","https://openalex.org/W2733722625","https://openalex.org/W2771678286","https://openalex.org/W2890810933","https://openalex.org/W2901151390","https://openalex.org/W3003753408","https://openalex.org/W3193144889","https://openalex.org/W3197264354","https://openalex.org/W3209173547","https://openalex.org/W4401018115","https://openalex.org/W4406014947","https://openalex.org/W4410810368","https://openalex.org/W4411725362"],"related_works":[],"abstract_inverted_index":{"K-Means":[0,110,141,159],"is":[1,37],"a":[2,106,145],"clustering":[3],"technique":[4],"widely":[5],"employed":[6],"in":[7],"AI":[8,64,122,151,181],"workloads,":[9],"from":[10],"image":[11],"processing":[12],"to":[13,57,93,102,131,143,199],"data":[14,133,166],"mining.":[15],"Given":[16],"its":[17],"importance,":[18],"researchers":[19],"propose":[20,144],"different":[21,140],"algorithms":[22],"and":[23,69,128,174,179],"hardware-accelerated":[24],"implementations.":[25],"While":[26],"algorithm":[27,126,147],"suitability":[28],"can":[29,53],"depend":[30],"on":[31,160,208],"the":[32,42,46,51,58,83,103,117,170,180,193],"target":[33,59],"use":[34,60],"case,":[35],"there":[36],"much":[38],"less":[39],"doubt":[40],"about":[41],"architecture:":[43],"FPGAs":[44,164],"are":[45,74,98,121],"de":[47],"facto":[48],"standard,":[49],"as":[50,67,169],"design":[52,186],"be":[54],"perfectly":[55],"tailored":[56],"case.":[61],"Despite":[62],"this,":[63],"accelerators":[65],"such":[66],"GPUs":[68,209],"Neural":[70],"Processing":[71],"Units":[72],"(NPUs)":[73],"gaining":[75],"traction.":[76],"The":[77,89],"former":[78],"attains":[79],"remarkable":[80],"performance":[81],"at":[82],"cost":[84],"of":[85,105,177,189],"low":[86],"energy":[87,215],"efficiency.":[88],"latter,":[90],"instead,":[91],"promises":[92],"maximize":[94],"both,":[95],"but":[96,213],"they":[97],"strongly":[99],"underutilized":[100],"due":[101],"lack":[104],"clear":[107],"approach":[108],"for":[109,115,165,183],"acceleration.":[111],"Considering":[112],"AMD":[113],"NPU,":[114],"example,":[116],"main":[118],"computing":[119],"cores":[120],"Engines":[123,173],"that":[124,148],"require":[125],"reshaping":[127],"code":[129],"optimization":[130],"harness":[132],"parallelism":[134],"effectively.":[135],"Thus,":[136],"this":[137],"research":[138],"analyzes":[139],"versions":[142],"vectorized":[146,158],"fully":[149],"uses":[150],"Engine":[152,182],"(AIE)":[153],"features.":[154],"We":[155,196],"validate":[156],"our":[157],"Versal":[161],"VCK5000,":[162],"using":[163],"movement":[167],"only,":[168],"Memory":[171],"Transfer":[172],"Shim":[175],"Tiles":[176],"NPUs,":[178,191],"computation.":[184],"This":[185],"reflects":[187],"features":[188],"modern":[190],"making":[192],"validation":[194],"fair.":[195],"attain":[197],"up":[198],"<tex":[200],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[201],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$59.5":[202],"\\times$</tex>":[203],"speedup":[204],"against":[205],"Torch":[206],"library":[207],"while":[210],"being":[211],"comparable":[212],"more":[214],"efficient":[216],"than":[217],"further":[218],"optimized":[219],"GPU":[220],"solutions.":[221]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2026-03-27T00:00:00"}
