{"id":"https://openalex.org/W4412939970","doi":"https://doi.org/10.1109/tc.2025.3595078","title":"Parallelization Strategies for DeepMD-Kit Using OpenMP: Enhancing Efficiency in Machine Learning-Based Molecular Simulations","display_name":"Parallelization Strategies for DeepMD-Kit Using OpenMP: Enhancing Efficiency in Machine Learning-Based Molecular Simulations","publication_year":2025,"publication_date":"2025-08-04","ids":{"openalex":"https://openalex.org/W4412939970","doi":"https://doi.org/10.1109/tc.2025.3595078"},"language":"en","primary_location":{"id":"doi:10.1109/tc.2025.3595078","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tc.2025.3595078","pdf_url":null,"source":{"id":"https://openalex.org/S157670870","display_name":"IEEE Transactions on Computers","issn_l":"0018-9340","issn":["0018-9340","1557-9956","2326-3814"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computers","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Qi Du","orcid":"https://orcid.org/0009-0008-1584-5360"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Qi Du","raw_affiliation_strings":["College of Computer Science and Electronic Engineering, Hunan University, Changsha, China","College of Computer Science and Electronic Engineering at Hunan University, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Electronic Engineering, Hunan University, Changsha, China","institution_ids":["https://openalex.org/I16609230"]},{"raw_affiliation_string":"College of Computer Science and Electronic Engineering at Hunan University, Changsha, China","institution_ids":["https://openalex.org/I16609230"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Feng Wang","orcid":"https://orcid.org/0009-0002-4009-6783"},"institutions":[{"id":"https://openalex.org/I16609230","display_name":"Hunan University","ror":"https://ror.org/05htk5m33","country_code":"CN","type":"education","lineage":["https://openalex.org/I16609230"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Feng Wang","raw_affiliation_strings":["College of Computer Science and Electronic Engineering, Hunan University, Changsha, China","College of Computer Science and Electronic Engineering at Hunan University, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Electronic Engineering, Hunan University, Changsha, China","institution_ids":["https://openalex.org/I16609230"]},{"raw_affiliation_string":"College of Computer Science and Electronic Engineering at Hunan University, Changsha, China","institution_ids":["https://openalex.org/I16609230"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5054335730","display_name":"Chengkun Wu","orcid":"https://orcid.org/0000-0002-9688-5311"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chengkun Wu","raw_affiliation_strings":["College of Computer Science and Technology, National University of Defense Technology, Changsha, China","College of Computer Science and Technology at National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]},{"raw_affiliation_string":"College of Computer Science and Technology at National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I16609230"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.13703607,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"74","issue":"10","first_page":"3534","last_page":"3545"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.987500011920929,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.987500011920929,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12867","display_name":"Advanced Biosensing Techniques and Applications","score":0.9020000100135803,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.9003999829292297,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7963481545448303},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7566124796867371},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.5262916684150696},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3355366587638855},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.32822299003601074}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7963481545448303},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7566124796867371},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.5262916684150696},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3355366587638855},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.32822299003601074}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tc.2025.3595078","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tc.2025.3595078","pdf_url":null,"source":{"id":"https://openalex.org/S157670870","display_name":"IEEE Transactions on Computers","issn_l":"0018-9340","issn":["0018-9340","1557-9956","2326-3814"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Computers","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3602879582","display_name":null,"funder_award_id":"2022YFA1004303","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W1031578623","https://openalex.org/W1971346858","https://openalex.org/W1978101105","https://openalex.org/W2060079863","https://openalex.org/W2136434791","https://openalex.org/W2144141804","https://openalex.org/W2153789213","https://openalex.org/W2171268876","https://openalex.org/W2742127985","https://openalex.org/W2884767181","https://openalex.org/W3006005697","https://openalex.org/W3027308092","https://openalex.org/W3046751266","https://openalex.org/W3082141065","https://openalex.org/W3201073812","https://openalex.org/W4220914069","https://openalex.org/W4383995031"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"DeepMD-kit":[0,22],"enables":[1],"deep":[2],"learning-based":[3],"molecular":[4],"dynamics":[5],"(MD)":[6],"simulations":[7],"that":[8],"require":[9],"efficient":[10],"parallelization":[11],"to":[12,27,57,59,69,97],"leverage":[13],"modern":[14],"HPC":[15],"architectures.":[16],"In":[17],"this":[18],"work,":[19],"we":[20],"optimize":[21],"using":[23],"advanced":[24],"OpenMP":[25],"strategies":[26],"improve":[28],"scalability":[29],"and":[30,53,62,87],"computational":[31],"efficiency":[32,67],"on":[33],"an":[34],"ARMv8":[35],"processor-based":[36],"server.":[37],"Our":[38],"optimizations":[39],"include":[40],"data":[41],"parallelism":[42],"for":[43],"neural":[44],"network":[45],"inference,":[46],"force":[47],"calculation":[48],"acceleration,":[49],"NUMAaware":[50],"memory":[51,65],"management,":[52],"synchronization":[54,99],"reductions,":[55],"leading":[56],"up":[58],"4.1\u00d7":[60],"speedup":[61,78],"82%":[63],"higher":[64],"band-width":[66],"compared":[68],"the":[70],"baseline":[71],"implementation.":[72],"Strong":[73],"scaling":[74],"analysis":[75],"demonstrates":[76],"superlinear":[77],"at":[79,93],"mid-range":[80],"core":[81],"counts,":[82],"with":[83],"improved":[84],"workload":[85],"balancing":[86],"vectorized":[88],"computations.":[89],"However,":[90],"challenges":[91],"remain":[92],"ultra-large":[94],"scales":[95],"due":[96],"increasing":[98],"overhead.":[100]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
