{"id":"https://openalex.org/W4414909298","doi":"https://doi.org/10.1109/cluster59342.2025.11186493","title":"Towards High-Performance and Portable Molecular Docking on CPUs Through Vectorization","display_name":"Towards High-Performance and Portable Molecular Docking on CPUs Through Vectorization","publication_year":2025,"publication_date":"2025-09-02","ids":{"openalex":"https://openalex.org/W4414909298","doi":"https://doi.org/10.1109/cluster59342.2025.11186493"},"language":"en","primary_location":{"id":"doi:10.1109/cluster59342.2025.11186493","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cluster59342.2025.11186493","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Cluster Computing (CLUSTER)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://hdl.handle.net/11311/1297908","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5055263185","display_name":"Gianmarco Accordi","orcid":"https://orcid.org/0000-0001-8023-2108"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Gianmarco Accordi","raw_affiliation_strings":["Politecnico di Milano,Dipartimento di Elettronica, Informazione e Bioingegneria,Milan,Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Milano,Dipartimento di Elettronica, Informazione e Bioingegneria,Milan,Italy","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039069961","display_name":"Jens Domke","orcid":"https://orcid.org/0000-0002-5343-414X"},"institutions":[{"id":"https://openalex.org/I4210129730","display_name":"RIKEN Center for Computational Science","ror":"https://ror.org/03r519674","country_code":"JP","type":"facility","lineage":["https://openalex.org/I4210110652","https://openalex.org/I4210129730"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Jens Domke","raw_affiliation_strings":["RIKEN Center for Computational Science,Kobe,Japan"],"affiliations":[{"raw_affiliation_string":"RIKEN Center for Computational Science,Kobe,Japan","institution_ids":["https://openalex.org/I4210129730"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079210568","display_name":"Theresa Pollinger","orcid":"https://orcid.org/0000-0002-0186-4340"},"institutions":[{"id":"https://openalex.org/I4210129730","display_name":"RIKEN Center for Computational Science","ror":"https://ror.org/03r519674","country_code":"JP","type":"facility","lineage":["https://openalex.org/I4210110652","https://openalex.org/I4210129730"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Theresa Pollinger","raw_affiliation_strings":["RIKEN Center for Computational Science,Kobe,Japan"],"affiliations":[{"raw_affiliation_string":"RIKEN Center for Computational Science,Kobe,Japan","institution_ids":["https://openalex.org/I4210129730"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059293847","display_name":"Davide Gadioli","orcid":"https://orcid.org/0000-0002-0143-0737"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Davide Gadioli","raw_affiliation_strings":["Politecnico di Milano,Dipartimento di Elettronica, Informazione e Bioingegneria,Milan,Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Milano,Dipartimento di Elettronica, Informazione e Bioingegneria,Milan,Italy","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077005193","display_name":"Gianluca Palermo","orcid":"https://orcid.org/0000-0001-7955-8012"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Gianluca Palermo","raw_affiliation_strings":["Politecnico di Milano,Dipartimento di Elettronica, Informazione e Bioingegneria,Milan,Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Milano,Dipartimento di Elettronica, Informazione e Bioingegneria,Milan,Italy","institution_ids":["https://openalex.org/I93860229"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5055263185"],"corresponding_institution_ids":["https://openalex.org/I93860229"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.15247356,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"14"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13182","display_name":"Quantum-Dot Cellular Automata","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13052","display_name":"Molecular Communication and Nanonetworks","score":0.9846000075340271,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/x86","display_name":"x86","score":0.7904999852180481},{"id":"https://openalex.org/keywords/software-portability","display_name":"Software portability","score":0.786899983882904},{"id":"https://openalex.org/keywords/vectorization","display_name":"Vectorization (mathematics)","score":0.7386000156402588},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.6273999810218811},{"id":"https://openalex.org/keywords/supercomputer","display_name":"Supercomputer","score":0.4968000054359436},{"id":"https://openalex.org/keywords/codebase","display_name":"Codebase","score":0.4948999881744385},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.41670000553131104},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.3749000132083893}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7943000197410583},{"id":"https://openalex.org/C170723468","wikidata":"https://www.wikidata.org/wiki/Q182933","display_name":"x86","level":3,"score":0.7904999852180481},{"id":"https://openalex.org/C63000827","wikidata":"https://www.wikidata.org/wiki/Q3080428","display_name":"Software portability","level":2,"score":0.786899983882904},{"id":"https://openalex.org/C41681595","wikidata":"https://www.wikidata.org/wiki/Q7917855","display_name":"Vectorization (mathematics)","level":2,"score":0.7386000156402588},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.6273999810218811},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.4968000054359436},{"id":"https://openalex.org/C51929080","wikidata":"https://www.wikidata.org/wiki/Q2425187","display_name":"Codebase","level":3,"score":0.4948999881744385},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4779999852180481},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.44130000472068787},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.41670000553131104},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.3749000132083893},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.34540000557899475},{"id":"https://openalex.org/C2780165032","wikidata":"https://www.wikidata.org/wiki/Q16869822","display_name":"Energy consumption","level":2,"score":0.34369999170303345},{"id":"https://openalex.org/C34165917","wikidata":"https://www.wikidata.org/wiki/Q188267","display_name":"Programming paradigm","level":2,"score":0.3336000144481659},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.3310999870300293},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.3294000029563904},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.3183000087738037},{"id":"https://openalex.org/C49154492","wikidata":"https://www.wikidata.org/wiki/Q5300","display_name":"Central processing unit","level":2,"score":0.3084999918937683},{"id":"https://openalex.org/C133162039","wikidata":"https://www.wikidata.org/wiki/Q1061077","display_name":"Code generation","level":3,"score":0.2919999957084656},{"id":"https://openalex.org/C160145156","wikidata":"https://www.wikidata.org/wiki/Q778586","display_name":"Executable","level":2,"score":0.2766000032424927},{"id":"https://openalex.org/C2778915421","wikidata":"https://www.wikidata.org/wiki/Q3643177","display_name":"Performance improvement","level":2,"score":0.26179999113082886},{"id":"https://openalex.org/C96972482","wikidata":"https://www.wikidata.org/wiki/Q1049168","display_name":"Xeon Phi","level":2,"score":0.25929999351501465},{"id":"https://openalex.org/C2778100165","wikidata":"https://www.wikidata.org/wiki/Q1589327","display_name":"Memory hierarchy","level":3,"score":0.2563999891281128},{"id":"https://openalex.org/C76752949","wikidata":"https://www.wikidata.org/wiki/Q7607499","display_name":"Stencil","level":2,"score":0.25380000472068787}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/cluster59342.2025.11186493","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cluster59342.2025.11186493","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Cluster Computing (CLUSTER)","raw_type":"proceedings-article"},{"id":"pmh:oai:re.public.polimi.it:11311/1297908","is_oa":true,"landing_page_url":"https://hdl.handle.net/11311/1297908","pdf_url":null,"source":{"id":"https://openalex.org/S4306400312","display_name":"Virtual Community of Pathological Anatomy (University of Castilla La Mancha)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79189158","host_organization_name":"University of Castilla-La Mancha","host_organization_lineage":["https://openalex.org/I79189158"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":{"id":"pmh:oai:re.public.polimi.it:11311/1297908","is_oa":true,"landing_page_url":"https://hdl.handle.net/11311/1297908","pdf_url":null,"source":{"id":"https://openalex.org/S4306400312","display_name":"Virtual Community of Pathological Anatomy (University of Castilla La Mancha)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79189158","host_organization_name":"University of Castilla-La Mancha","host_organization_lineage":["https://openalex.org/I79189158"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recent":[0],"trends":[1],"in":[2],"the":[3,39,51,100,110],"HPC":[4,94],"field":[5],"have":[6],"introduced":[7],"new":[8],"CPU":[9],"architectures":[10,156],"with":[11,73],"improved":[12],"vectorization":[13,65,152],"capabilities":[14],"that":[15,136],"require":[16],"optimization":[17,106],"to":[18,66,109,130,149],"achieve":[19,67,140],"peak":[20],"performance":[21,27,68,128,143],"and":[22,41,57,63,105,161],"thus":[23],"pose":[24],"challenges":[25],"for":[26,35,43,116],"portability.":[28],"The":[29],"deployment":[30],"of":[31,113],"high-performing":[32],"scientific":[33,114],"applications":[34,47,115],"CPUs":[36,72,138],"requires":[37],"adapting":[38],"codebase":[40],"optimizing":[42],"performance.":[44],"Evaluating":[45],"these":[46],"provides":[48],"insights":[49,98],"into":[50,99],"complex":[52],"interactions":[53],"between":[54],"code,":[55],"compilers,":[56],"hardware.":[58],"We":[59,76,96],"evaluate":[60],"compiler":[61],"auto-vectorization":[62],"explicit":[64,131],"portability":[69],"across":[70,93],"modern":[71],"long":[74],"vectors.":[75],"select":[77],"a":[78,83],"molecular":[79],"docking":[80],"application":[81],"as":[82,86],"case":[84],"study,":[85],"it":[87],"represents":[88],"computational":[89],"patterns":[90],"commonly":[91],"found":[92],"workloads.":[95],"report":[97],"technical":[101],"challenges,":[102],"architectural":[103],"trends,":[104],"strategies":[107],"relevant":[108],"future":[111],"development":[112],"HPC.":[117],"Our":[118],"results":[119],"show":[120],"which":[121],"code":[122],"transformations":[123],"enable":[124],"portable":[125],"auto-vectorization,":[126],"reaching":[127],"similar":[129],"vectorization.":[132],"Experimental":[133],"data":[134],"confirms":[135],"x86":[137],"typically":[139],"higher":[141],"execution":[142],"than":[144],"ARM":[145,155],"CPUs,":[146],"primarily":[147],"due":[148],"their":[150],"wider":[151],"units.":[153],"However,":[154],"demonstrate":[157],"competitive":[158],"energy":[159],"consumption":[160],"cost-effectiveness.":[162]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
