{"id":"https://openalex.org/W2589144156","doi":"https://doi.org/10.1109/lca.2017.2672559","title":"Transcending Hardware Limits with Software Out-of-Order Processing","display_name":"Transcending Hardware Limits with Software Out-of-Order Processing","publication_year":2017,"publication_date":"2017-02-22","ids":{"openalex":"https://openalex.org/W2589144156","doi":"https://doi.org/10.1109/lca.2017.2672559","mag":"2589144156"},"language":"en","primary_location":{"id":"doi:10.1109/lca.2017.2672559","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lca.2017.2672559","pdf_url":null,"source":{"id":"https://openalex.org/S17643076","display_name":"IEEE Computer Architecture Letters","issn_l":"1556-6056","issn":["1556-6056","1556-6064","2473-2575"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Computer Architecture Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069683581","display_name":"Trevor E. Carlson","orcid":"https://orcid.org/0000-0001-8742-134X"},"institutions":[{"id":"https://openalex.org/I123387679","display_name":"Uppsala University","ror":"https://ror.org/048a87296","country_code":"SE","type":"education","lineage":["https://openalex.org/I123387679"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Trevor E. Carlson","raw_affiliation_strings":["Uppsala University, Uppsala, Sweden"],"raw_orcid":"https://orcid.org/0000-0001-8742-134X","affiliations":[{"raw_affiliation_string":"Uppsala University, Uppsala, Sweden","institution_ids":["https://openalex.org/I123387679"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076024711","display_name":"Kim-Anh Tran","orcid":"https://orcid.org/0000-0003-4988-505X"},"institutions":[{"id":"https://openalex.org/I123387679","display_name":"Uppsala University","ror":"https://ror.org/048a87296","country_code":"SE","type":"education","lineage":["https://openalex.org/I123387679"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Kim-Anh Tran","raw_affiliation_strings":["Uppsala University, Uppsala, Sweden"],"raw_orcid":"https://orcid.org/0000-0003-4988-505X","affiliations":[{"raw_affiliation_string":"Uppsala University, Uppsala, Sweden","institution_ids":["https://openalex.org/I123387679"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039379608","display_name":"Alexandra Jimborean","orcid":"https://orcid.org/0000-0001-8642-2447"},"institutions":[{"id":"https://openalex.org/I123387679","display_name":"Uppsala University","ror":"https://ror.org/048a87296","country_code":"SE","type":"education","lineage":["https://openalex.org/I123387679"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Alexandra Jimborean","raw_affiliation_strings":["Uppsala University, Uppsala, Sweden"],"raw_orcid":"https://orcid.org/0000-0001-8642-2447","affiliations":[{"raw_affiliation_string":"Uppsala University, Uppsala, Sweden","institution_ids":["https://openalex.org/I123387679"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038256203","display_name":"Konstantinos Koukos","orcid":"https://orcid.org/0000-0002-9460-1290"},"institutions":[{"id":"https://openalex.org/I123387679","display_name":"Uppsala University","ror":"https://ror.org/048a87296","country_code":"SE","type":"education","lineage":["https://openalex.org/I123387679"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Konstantinos Koukos","raw_affiliation_strings":["Uppsala University, Uppsala, Sweden"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Uppsala University, Uppsala, Sweden","institution_ids":["https://openalex.org/I123387679"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024358692","display_name":"Magnus Sj\u00e4lander","orcid":"https://orcid.org/0000-0003-4232-6976"},"institutions":[{"id":"https://openalex.org/I123387679","display_name":"Uppsala University","ror":"https://ror.org/048a87296","country_code":"SE","type":"education","lineage":["https://openalex.org/I123387679"]},{"id":"https://openalex.org/I204778367","display_name":"Norwegian University of Science and Technology","ror":"https://ror.org/05xg72x27","country_code":"NO","type":"education","lineage":["https://openalex.org/I204778367"]}],"countries":["NO","SE"],"is_corresponding":false,"raw_author_name":"Magnus Sjalander","raw_affiliation_strings":["Norwegian University of Science and Technology (NTNU), Trondheim, Norway","Uppsala University, Uppsala, Sweden"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Norwegian University of Science and Technology (NTNU), Trondheim, Norway","institution_ids":["https://openalex.org/I204778367"]},{"raw_affiliation_string":"Uppsala University, Uppsala, Sweden","institution_ids":["https://openalex.org/I123387679"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5020214726","display_name":"Stefanos Kaxiras","orcid":"https://orcid.org/0000-0001-8267-0232"},"institutions":[{"id":"https://openalex.org/I123387679","display_name":"Uppsala University","ror":"https://ror.org/048a87296","country_code":"SE","type":"education","lineage":["https://openalex.org/I123387679"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Stefanos Kaxiras","raw_affiliation_strings":["Uppsala University, Uppsala, Sweden"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Uppsala University, Uppsala, Sweden","institution_ids":["https://openalex.org/I123387679"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.01784892,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"16","issue":"2","first_page":"162","last_page":"165"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11005","display_name":"Radiation Effects in Electronics","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.814750075340271},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.7303525805473328},{"id":"https://openalex.org/keywords/out-of-order-execution","display_name":"Out-of-order execution","score":0.6583542227745056},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.586524248123169},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.5452495217323303},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.5208266973495483},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.5137273073196411},{"id":"https://openalex.org/keywords/instruction-set","display_name":"Instruction set","score":0.5052366852760315},{"id":"https://openalex.org/keywords/microarchitecture","display_name":"Microarchitecture","score":0.4614395499229431},{"id":"https://openalex.org/keywords/instructions-per-cycle","display_name":"Instructions per cycle","score":0.4104631841182709},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.3846789300441742},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.3247220516204834},{"id":"https://openalex.org/keywords/central-processing-unit","display_name":"Central processing unit","score":0.1500234603881836},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.10469996929168701}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.814750075340271},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.7303525805473328},{"id":"https://openalex.org/C1793878","wikidata":"https://www.wikidata.org/wiki/Q1153762","display_name":"Out-of-order execution","level":2,"score":0.6583542227745056},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.586524248123169},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.5452495217323303},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.5208266973495483},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.5137273073196411},{"id":"https://openalex.org/C202491316","wikidata":"https://www.wikidata.org/wiki/Q272683","display_name":"Instruction set","level":2,"score":0.5052366852760315},{"id":"https://openalex.org/C107598950","wikidata":"https://www.wikidata.org/wiki/Q259864","display_name":"Microarchitecture","level":2,"score":0.4614395499229431},{"id":"https://openalex.org/C156972235","wikidata":"https://www.wikidata.org/wiki/Q1443434","display_name":"Instructions per cycle","level":3,"score":0.4104631841182709},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3846789300441742},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.3247220516204834},{"id":"https://openalex.org/C49154492","wikidata":"https://www.wikidata.org/wiki/Q5300","display_name":"Central processing unit","level":2,"score":0.1500234603881836},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.10469996929168701},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lca.2017.2672559","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lca.2017.2672559","pdf_url":null,"source":{"id":"https://openalex.org/S17643076","display_name":"IEEE Computer Architecture Letters","issn_l":"1556-6056","issn":["1556-6056","1556-6064","2473-2575"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Computer Architecture Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7","score":0.9100000262260437}],"awards":[{"id":"https://openalex.org/G6281187374","display_name":null,"funder_award_id":"C0533201","funder_id":"https://openalex.org/F4320322581","funder_display_name":"Vetenskapsr\u00e5det"},{"id":"https://openalex.org/G794501901","display_name":null,"funder_award_id":"610490","funder_id":"https://openalex.org/F4320334960","funder_display_name":"Seventh Framework Programme"}],"funders":[{"id":"https://openalex.org/F4320322581","display_name":"Vetenskapsr\u00e5det","ror":"https://ror.org/03zttf063"},{"id":"https://openalex.org/F4320334960","display_name":"Seventh Framework Programme","ror":"https://ror.org/00k4n6c32"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W2019674193","https://openalex.org/W2100869242","https://openalex.org/W2133356510","https://openalex.org/W2167850096","https://openalex.org/W2169229905","https://openalex.org/W2170675137","https://openalex.org/W2239894058","https://openalex.org/W2296006986","https://openalex.org/W2297094725","https://openalex.org/W4238437267","https://openalex.org/W4247317410","https://openalex.org/W6655537688","https://openalex.org/W6679671849"],"related_works":["https://openalex.org/W2026084820","https://openalex.org/W2171175484","https://openalex.org/W2533681803","https://openalex.org/W2562747857","https://openalex.org/W2027935151","https://openalex.org/W4250432526","https://openalex.org/W2101536355","https://openalex.org/W2112915496","https://openalex.org/W2169029159","https://openalex.org/W2055341571"],"abstract_inverted_index":{"Building":[0],"high-performance,":[1],"next-generation":[2],"processors":[3],"require":[4],"novel":[5],"techniques":[6],"to":[7,31,41,63,68,120],"enable":[8],"improved":[9],"performance":[10,25,96,157],"given":[11],"today's":[12],"power-":[13],"and":[14,23,71,77,117],"energy-efficiency":[15],"requirements.":[16],"Additionally,":[17],"a":[18,154],"widening":[19],"gap":[20],"between":[21],"processor":[22,138],"memory":[24,44],"makes":[26],"it":[27],"even":[28],"more":[29],"difficult":[30],"improve":[32,72],"efficiency":[33,54,76,93],"with":[34,46,140,162,167],"conventional":[35,136],"techniques.":[36],"While":[37],"out-of-order":[38],"architectures":[39],"attempt":[40],"hide":[42],"this":[43,81],"latency":[45,106],"dynamically":[47],"reordered":[48],"instructions,":[49],"they":[50],"lack":[51],"the":[52,65,108,130,135,141],"energy":[53,75,92,169],"seen":[55],"in":[56,97],"in-order":[57,88],"processors.":[58],"Thus,":[59],"our":[60],"goal":[61],"is":[62],"reorder":[64],"instruction":[66,127],"stream":[67],"avoid":[69],"stalls":[70],"utilization":[73],"for":[74],"performance.":[78],"To":[79],"accomplish":[80],"goal,":[82],"we":[83],"propose":[84],"an":[85,163,168],"enhanced":[86],"stall-on-use":[87,165],"core":[89,113,132],"that":[90,151],"improves":[91],"(and":[94],"therefore":[95],"these":[98],"power-limited":[99],"designes)":[100],"through":[101],"out-of-program-order":[102],"execution.":[103],"During":[104],"long":[105],"loads,":[107],"Software":[109],"Out-of-Order":[110],"Processing":[111],"(SWOOP)":[112],"exposes":[114],"additional":[115],"memory-":[116],"instruction-level":[118],"parallelism":[119],"perform":[121],"useful,":[122],"non-speculative":[123],"work.":[124],"The":[125],"resulting":[126],"lookahead":[128],"of":[129,143,171],"SWOOP":[131,152],"reaches":[133],"beyond":[134],"fixed-sized":[137],"structures":[139],"help":[142],"transparent":[144],"hardware":[145],"register":[146],"contexts.":[147],"Our":[148],"results":[149],"show":[150],"demonstrates":[153],"34":[155],"percent":[156],"improvement":[158],"on":[159],"average":[160],"compared":[161],"in-order,":[164],"core,":[166],"reduction":[170],"23":[172],"percent.":[173]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
