{"id":"https://openalex.org/W4411143928","doi":"https://doi.org/10.1109/mm.2025.3577524","title":"Scalar Vector Runahead: Removing the Shackles of Indirect Memory Chains on In-Order Cores","display_name":"Scalar Vector Runahead: Removing the Shackles of Indirect Memory Chains on In-Order Cores","publication_year":2025,"publication_date":"2025-06-09","ids":{"openalex":"https://openalex.org/W4411143928","doi":"https://doi.org/10.1109/mm.2025.3577524"},"language":"en","primary_location":{"id":"doi:10.1109/mm.2025.3577524","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mm.2025.3577524","pdf_url":null,"source":{"id":"https://openalex.org/S59697426","display_name":"IEEE Micro","issn_l":"0272-1732","issn":["0272-1732","1937-4143"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Micro","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://biblio.ugent.be/publication/01KAV5NXVGFYFQVQ729PMTGGSS/file/01KAV616XGH3HJRTSVKJAKQMYX.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5093450444","display_name":"Jaime Roelandts","orcid":"https://orcid.org/0000-0001-8937-6888"},"institutions":[{"id":"https://openalex.org/I2801227569","display_name":"Ghent University Hospital","ror":"https://ror.org/00xmkp704","country_code":"BE","type":"healthcare","lineage":["https://openalex.org/I2801227569"]}],"countries":["BE"],"is_corresponding":true,"raw_author_name":"Jaime Roelandts","raw_affiliation_strings":["Ghent University, Ghent, Belgium"],"affiliations":[{"raw_affiliation_string":"Ghent University, Ghent, Belgium","institution_ids":["https://openalex.org/I2801227569"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043018563","display_name":"Ajeya Naithani","orcid":"https://orcid.org/0000-0002-8291-4230"},"institutions":[{"id":"https://openalex.org/I83019370","display_name":"Eindhoven University of Technology","ror":"https://ror.org/02c2kyt77","country_code":"NL","type":"education","lineage":["https://openalex.org/I83019370"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Ajeya Naithani","raw_affiliation_strings":["TU Eindhoven, Eindhoven, The Netherlands"],"affiliations":[{"raw_affiliation_string":"TU Eindhoven, Eindhoven, The Netherlands","institution_ids":["https://openalex.org/I83019370"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041446247","display_name":"Sam Ainsworth","orcid":"https://orcid.org/0000-0002-3726-0055"},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Sam Ainsworth","raw_affiliation_strings":["University of Edinburgh, Edinburgh, U.K"],"affiliations":[{"raw_affiliation_string":"University of Edinburgh, Edinburgh, U.K","institution_ids":["https://openalex.org/I98677209"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047443783","display_name":"Timothy M. Jones","orcid":"https://orcid.org/0000-0002-4114-7661"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Timothy M. Jones","raw_affiliation_strings":["University of Cambridge, Cambridge, U.K"],"affiliations":[{"raw_affiliation_string":"University of Cambridge, Cambridge, U.K","institution_ids":["https://openalex.org/I241749"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033119975","display_name":"Lieven Eeckhout","orcid":"https://orcid.org/0000-0001-8792-4473"},"institutions":[{"id":"https://openalex.org/I2801227569","display_name":"Ghent University Hospital","ror":"https://ror.org/00xmkp704","country_code":"BE","type":"healthcare","lineage":["https://openalex.org/I2801227569"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Lieven Eeckhout","raw_affiliation_strings":["Ghent University, Ghent, Belgium"],"affiliations":[{"raw_affiliation_string":"Ghent University, Ghent, Belgium","institution_ids":["https://openalex.org/I2801227569"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5093450444"],"corresponding_institution_ids":["https://openalex.org/I2801227569"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.11648284,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"45","issue":"4","first_page":"72","last_page":"78"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9514999985694885,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9514999985694885,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9431999921798706,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7748806476593018},{"id":"https://openalex.org/keywords/scalar","display_name":"Scalar (mathematics)","score":0.6736539602279663},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5002572536468506},{"id":"https://openalex.org/keywords/order","display_name":"Order (exchange)","score":0.42465314269065857},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.15670746564865112}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7748806476593018},{"id":"https://openalex.org/C57691317","wikidata":"https://www.wikidata.org/wiki/Q1289248","display_name":"Scalar (mathematics)","level":2,"score":0.6736539602279663},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5002572536468506},{"id":"https://openalex.org/C182306322","wikidata":"https://www.wikidata.org/wiki/Q1779371","display_name":"Order (exchange)","level":2,"score":0.42465314269065857},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15670746564865112},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/mm.2025.3577524","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mm.2025.3577524","pdf_url":null,"source":{"id":"https://openalex.org/S59697426","display_name":"IEEE Micro","issn_l":"0272-1732","issn":["0272-1732","1937-4143"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Micro","raw_type":"journal-article"},{"id":"pmh:oai:archive.ugent.be:01KAV5NXVGFYFQVQ729PMTGGSS","is_oa":true,"landing_page_url":"http://hdl.handle.net/1854/LU-01KAV5NXVGFYFQVQ729PMTGGSS","pdf_url":"https://biblio.ugent.be/publication/01KAV5NXVGFYFQVQ729PMTGGSS/file/01KAV616XGH3HJRTSVKJAKQMYX.pdf","source":{"id":"https://openalex.org/S4306400478","display_name":"Ghent University Academic Bibliography (Ghent University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I32597200","host_organization_name":"Ghent University","host_organization_lineage":["https://openalex.org/I32597200"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"ISSN: 1937-4143","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:pure.tue.nl:publications/55fc55fa-7f1f-4ede-975d-29a4da2adf86","is_oa":true,"landing_page_url":"https://research.tue.nl/en/publications/55fc55fa-7f1f-4ede-975d-29a4da2adf86","pdf_url":"https://pure.tue.nl/ws/files/382645841/Scalar_Vector_Runahead_Removing_the_Shackles_of_Indirect_Memory_Chains_on_In-Order_Cores.pdf","source":{"id":"https://openalex.org/S4406922641","display_name":"TU/e Research Portal","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Roelandts, J, Naithani, A, Ainsworth, S, Jones, T M & Eeckhout, L 2025, 'Scalar Vector Runahead : Removing the Shackles of Indirect Memory Chains on In-Order Cores', IEEE Micro, vol. 45, no. 4, 11029128, pp. 72-78. https://doi.org/10.1109/MM.2025.3577524","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:doi:10.17863/cam.120072","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"}],"best_oa_location":{"id":"pmh:oai:archive.ugent.be:01KAV5NXVGFYFQVQ729PMTGGSS","is_oa":true,"landing_page_url":"http://hdl.handle.net/1854/LU-01KAV5NXVGFYFQVQ729PMTGGSS","pdf_url":"https://biblio.ugent.be/publication/01KAV5NXVGFYFQVQ729PMTGGSS/file/01KAV616XGH3HJRTSVKJAKQMYX.pdf","source":{"id":"https://openalex.org/S4306400478","display_name":"Ghent University Academic Bibliography (Ghent University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I32597200","host_organization_name":"Ghent University","host_organization_lineage":["https://openalex.org/I32597200"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"ISSN: 1937-4143","raw_type":"info:eu-repo/semantics/publishedVersion"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1313632636","display_name":null,"funder_award_id":"741097","funder_id":"https://openalex.org/F4320334678","funder_display_name":"European Research Council"},{"id":"https://openalex.org/G1824026583","display_name":null,"funder_award_id":"G018722N","funder_id":"https://openalex.org/F4320321730","funder_display_name":"Fonds Wetenschappelijk Onderzoek"},{"id":"https://openalex.org/G7497161057","display_name":"ParaSol: Fine-Grained Thread-Level Parallelism for Single-Threaded Performance","funder_award_id":"EP/W00576X/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320321730","display_name":"Fonds Wetenschappelijk Onderzoek","ror":"https://ror.org/03qtxy027"},{"id":"https://openalex.org/F4320327336","display_name":"Vlaamse regering","ror":null},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"},{"id":"https://openalex.org/F4320334678","display_name":"European Research Council","ror":"https://ror.org/0472cxd90"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4411143928.pdf","grobid_xml":"https://content.openalex.org/works/W4411143928.grobid-xml"},"referenced_works_count":9,"referenced_works":["https://openalex.org/W2009553719","https://openalex.org/W2170794761","https://openalex.org/W2922398414","https://openalex.org/W3194960030","https://openalex.org/W3205916498","https://openalex.org/W4389491899","https://openalex.org/W4394999098","https://openalex.org/W4395110137","https://openalex.org/W4404955410"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Modern":[0],"processors":[1],"often":[2],"face":[3],"the":[4,59,121],"memory":[5,66,77,85,101],"wall":[6],"as":[7],"a":[8,11,92,112,133,149],"significant":[9],"bottleneck,":[10],"problem":[12],"that":[13,61],"becomes":[14],"particularly":[15],"severe":[16],"when":[17],"using":[18],"stall-on-use":[19],"in-order":[20,31,136],"cores.":[21],"Despite":[22],"this":[23],"limitation,":[24],"there":[25],"is":[26],"growing":[27],"demand":[28],"for":[29,123],"energy-efficient":[30],"cores":[32],"due":[33],"to":[34,63,104,107],"privacy":[35],"and":[36,79,119,144],"sustainability":[37],"concerns.":[38],"Scalar":[39],"Vector":[40],"Runahead":[41],"(SVR)1":[42],"provides":[43],"an":[44,140],"elegant":[45],"solution":[46],"by":[47,83,139],"extracting":[48],"high":[49],"memory-level":[50],"parallelism":[51],"through":[52],"piggybacking":[53],"on":[54,58],"existing":[55],"instructions":[56],"executed":[57],"processor":[60],"lead":[62],"future":[64],"irregular":[65],"accesses.":[67],"SVR":[68,127],"speculatively":[69],"executes":[70],"multiple":[71],"transient,":[72],"independent,":[73],"parallel":[74],"instances":[75],"of":[76,91,115],"accesses":[78,86,102],"their":[80],"instruction":[81],"chains,":[82],"initiating":[84],"from":[87],"many":[88],"different":[89],"values":[90],"predicted":[93],"induction":[94],"variable.":[95],"This":[96],"approach":[97],"moves":[98],"mutually":[99],"independent":[100],"next":[103],"each":[105],"other":[106],"hide":[108],"dependent":[109],"stalls.":[110],"With":[111],"hardware":[113,124],"overhead":[114],"only":[116],"2":[117],"KiB":[118],"without":[120],"need":[122],"vector":[125],"extensions,":[126],"delivers":[128],"3.2\u00d7":[129],"higher":[130,146],"performance":[131,147],"than":[132,148],"baseline":[134],"3-wide":[135],"core":[137],"inspired":[138],"Arm":[141],"Cortex":[142],"A510,":[143],"1.3\u00d7":[145],"full":[150],"out-of-order":[151],"core,":[152],"while":[153],"halving":[154],"energy":[155],"consumption.":[156]},"counts_by_year":[],"updated_date":"2026-04-16T15:07:20.185449","created_date":"2025-10-10T00:00:00"}
