{"id":"https://openalex.org/W1964191343","doi":"https://doi.org/10.1145/1022969.1022971","title":"Interaction cost and shotgun profiling","display_name":"Interaction cost and shotgun profiling","publication_year":2004,"publication_date":"2004-09-01","ids":{"openalex":"https://openalex.org/W1964191343","doi":"https://doi.org/10.1145/1022969.1022971","mag":"1964191343"},"language":"en","primary_location":{"id":"doi:10.1145/1022969.1022971","is_oa":true,"landing_page_url":"https://doi.org/10.1145/1022969.1022971","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/1022969.1022971","source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://dl.acm.org/doi/pdf/10.1145/1022969.1022971","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5051753109","display_name":"Brian A. Fields","orcid":null},"institutions":[{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Brian A. Fields","raw_affiliation_strings":["University of California, Berkeley, CA","University of California: Berkeley, CA#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of California, Berkeley, CA","institution_ids":["https://openalex.org/I95457486"]},{"raw_affiliation_string":"University of California: Berkeley, CA#TAB#","institution_ids":["https://openalex.org/I95457486"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085160432","display_name":"Rastislav Bod\u00edk","orcid":"https://orcid.org/0000-0001-6639-1647"},"institutions":[{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rastislav Bodik","raw_affiliation_strings":["University of California, Berkeley, CA","University of California: Berkeley, CA#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of California, Berkeley, CA","institution_ids":["https://openalex.org/I95457486"]},{"raw_affiliation_string":"University of California: Berkeley, CA#TAB#","institution_ids":["https://openalex.org/I95457486"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Mark D. Hill","orcid":null},"institutions":[{"id":"https://openalex.org/I135310074","display_name":"University of Wisconsin\u2013Madison","ror":"https://ror.org/01y2jtd41","country_code":"US","type":"education","lineage":["https://openalex.org/I135310074"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mark D. Hill","raw_affiliation_strings":["University of Wisconsin, Madison, WI","University of Wisconsin - Madison WI#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Wisconsin, Madison, WI","institution_ids":["https://openalex.org/I135310074"]},{"raw_affiliation_string":"University of Wisconsin - Madison WI#TAB#","institution_ids":["https://openalex.org/I135310074"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010832434","display_name":"Chris J. Newburn","orcid":null},"institutions":[{"id":"https://openalex.org/I4210158342","display_name":"Intel (United Kingdom)","ror":"https://ror.org/058cxws58","country_code":"GB","type":"company","lineage":["https://openalex.org/I1343180700","https://openalex.org/I4210158342"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Chris J. Newburn","raw_affiliation_strings":["Intel Corporation"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intel Corporation","institution_ids":["https://openalex.org/I4210158342"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.2401,"has_fulltext":true,"cited_by_count":42,"citation_normalized_percentile":{"value":0.93673669,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"1","issue":"3","first_page":"272","last_page":"304"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.892701268196106},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.6099233627319336},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.6050565838813782},{"id":"https://openalex.org/keywords/profiling","display_name":"Profiling (computer programming)","score":0.5920261740684509},{"id":"https://openalex.org/keywords/instruction-prefetch","display_name":"Instruction prefetch","score":0.515038251876831},{"id":"https://openalex.org/keywords/spec#","display_name":"Spec#","score":0.4745113253593445},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4587445855140686},{"id":"https://openalex.org/keywords/microarchitecture","display_name":"Microarchitecture","score":0.4504089653491974},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3484593629837036},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.34508049488067627},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.24768909811973572}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.892701268196106},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.6099233627319336},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.6050565838813782},{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.5920261740684509},{"id":"https://openalex.org/C133588205","wikidata":"https://www.wikidata.org/wiki/Q28455645","display_name":"Instruction prefetch","level":3,"score":0.515038251876831},{"id":"https://openalex.org/C2778565505","wikidata":"https://www.wikidata.org/wiki/Q2207566","display_name":"Spec#","level":2,"score":0.4745113253593445},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4587445855140686},{"id":"https://openalex.org/C107598950","wikidata":"https://www.wikidata.org/wiki/Q259864","display_name":"Microarchitecture","level":2,"score":0.4504089653491974},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3484593629837036},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.34508049488067627},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.24768909811973572},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/1022969.1022971","is_oa":true,"landing_page_url":"https://doi.org/10.1145/1022969.1022971","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/1022969.1022971","source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.70.1364","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.70.1364","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.ece.lsu.edu/tca/papers/fields04interaction.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.94.6507","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.94.6507","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cs.berkeley.edu/~bfields/bafl/taco04.pdf","raw_type":"text"}],"best_oa_location":{"id":"doi:10.1145/1022969.1022971","is_oa":true,"landing_page_url":"https://doi.org/10.1145/1022969.1022971","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/1022969.1022971","source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7","score":0.7200000286102295}],"awards":[{"id":"https://openalex.org/G103960779","display_name":"CAREER:  Scalable Compiler Optimizations for New Software","funder_award_id":"0093275","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G1241002992","display_name":"ITR/Language-Based Software Security","funder_award_id":"0326577","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G136828258","display_name":"Exploiting the Critical Path in the Design and Performance Analysis of Modern Processors","funder_award_id":"0105721","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G1627295659","display_name":"ITR: The Open Source Quality Project","funder_award_id":"0085949","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G225333856","display_name":"ITR:     Advanced Architectures and Technologies for Chip Multiprocessors","funder_award_id":"0324878","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G3033351227","display_name":"ITR: SafetyNet: Synergistic Support for Availability, Designability, Programmability, & Performance","funder_award_id":"0205286","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G5510993554","display_name":"CISE Research Infrastructure:  MIDSHIP:  Managing Image Data for Scalable High Performance","funder_award_id":"9623632","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6392137900","display_name":"Experimental Partnerships:  Multifacet:  Exploiting Prediction and Speculation in Multiprocessor Memory Systems","funder_award_id":"9971256","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6671297155","display_name":null,"funder_award_id":"CAREER","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7460574776","display_name":"ITR: Foundations of Hybrid and Embedded Software Systems","funder_award_id":"0225610","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7494585381","display_name":"CAREER:  Scalable Compiler Optimizations for New Software","funder_award_id":"0243657","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7907898941","display_name":"NGS:  Wisconsin DOVE: Distributed Optimizing Virtual Environment","funder_award_id":"0103670","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320307762","display_name":"International Business Machines Corporation","ror":"https://ror.org/05hh8d621"},{"id":"https://openalex.org/F4320315711","display_name":"Hill's Pet Nutrition","ror":null},{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W1964191343.pdf","grobid_xml":"https://content.openalex.org/works/W1964191343.grobid-xml"},"referenced_works_count":48,"referenced_works":["https://openalex.org/W1496940124","https://openalex.org/W1555915743","https://openalex.org/W1970963354","https://openalex.org/W1971403296","https://openalex.org/W2032094184","https://openalex.org/W2032732648","https://openalex.org/W2038769854","https://openalex.org/W2073617099","https://openalex.org/W2095667776","https://openalex.org/W2099661831","https://openalex.org/W2100767401","https://openalex.org/W2104205789","https://openalex.org/W2106018697","https://openalex.org/W2108730429","https://openalex.org/W2109659793","https://openalex.org/W2110296438","https://openalex.org/W2111880608","https://openalex.org/W2121050483","https://openalex.org/W2122939826","https://openalex.org/W2123973634","https://openalex.org/W2129094586","https://openalex.org/W2129269323","https://openalex.org/W2129760904","https://openalex.org/W2131498141","https://openalex.org/W2135183949","https://openalex.org/W2140351961","https://openalex.org/W2140384194","https://openalex.org/W2140759096","https://openalex.org/W2146173591","https://openalex.org/W2146307698","https://openalex.org/W2153131460","https://openalex.org/W2154512574","https://openalex.org/W2154693467","https://openalex.org/W2156359950","https://openalex.org/W2157050575","https://openalex.org/W2161910890","https://openalex.org/W2167195409","https://openalex.org/W2171036571","https://openalex.org/W2172190421","https://openalex.org/W2942827234","https://openalex.org/W3142074656","https://openalex.org/W4205854416","https://openalex.org/W4205890323","https://openalex.org/W4229524341","https://openalex.org/W4232019702","https://openalex.org/W4242556421","https://openalex.org/W4254473445","https://openalex.org/W6629902689"],"related_works":["https://openalex.org/W1983529203","https://openalex.org/W1511727231","https://openalex.org/W4381514859","https://openalex.org/W2100495790","https://openalex.org/W2469267785","https://openalex.org/W1578001114","https://openalex.org/W2391224155","https://openalex.org/W987201201","https://openalex.org/W2045913108","https://openalex.org/W2115316748"],"abstract_inverted_index":{"We":[0,170],"observe":[1,147],"that":[2,27,148,238,253],"the":[3,51,59,64,73,77,109,118,193,216,227,275,282],"challenges":[4],"software":[5],"optimizers":[6],"and":[7,49,103,144,153,202,231,306],"microarchitects":[8],"face":[9],"every":[10],"day":[11],"boil":[12],"down":[13],"to":[14,29,54,71,125,140,214,258,269],"a":[15,34,100,104,133,156,205,208,247],"single":[16],"problem:":[17],"bottleneck":[18,21],"analysis.":[19],"A":[20],"is":[22],"any":[23],"event":[24,67,113,138,260],"or":[25,38,168,188],"resource":[26],"contributes":[28],"execution":[30],"time,":[31],"such":[32,42,83,225],"as":[33,43,99,226,301,303],"critical":[35,297],"cache":[36,105,229],"miss":[37],"window":[39],"stall.":[40],"Tasks":[41],"tuning":[44],"processors":[45,81],"for":[46,117,136],"energy":[47],"efficiency":[48],"finding":[50,299],"right":[52],"loads":[53],"prefetch":[55],"all":[56,149],"require":[57],"measuring":[58],"performance":[60,90,218],"costs":[61,139,198,305],"of":[62,79,163,195,220,249,277,281,290],"bottlenecks.In":[63],"past,":[65],"simple":[66],"counts":[68],"were":[69],"enough":[70],"find":[72],"important":[74],"bottlenecks.":[75],"Today,":[76],"parallelism":[78],"modern":[80],"makes":[82],"analysis":[84],"much":[85],"more":[86],"difficult,":[87],"rendering":[88],"traditional":[89,259],"counters":[91],"less":[92],"useful.":[93],"If":[94],"two":[95,164],"microarchitectural":[96],"events":[97,154],"(such":[98],"fetch":[101],"stall":[102],"miss)":[106],"occur":[107],"in":[108,155,160,199,256],"same":[110],"cycle,":[111],"which":[112,179],"should":[114,122],"we":[115,123,131,146,191,211,242],"blame":[116],"cycle?":[119],"What":[120],"cost":[121,177],"assign":[124],"each":[126],"event?":[127],"In":[128,204],"this":[129],"paper,":[130],"introduce":[132],"new":[134],"model":[135],"understanding":[137],"facilitate":[141],"processor":[142,200,206],"design":[143,201,264],"optimization.First,":[145],"instructions,":[150,298],"hardware":[151,250,271],"structures,":[152],"machine":[157],"can":[158,180,292],"interact":[159,239],"only":[161,266],"one":[162],"ways":[165],"(in":[166],"parallel":[167],"serially).":[169],"quantify":[171],"these":[172,285],"interactions":[173],"by":[174,233],"defining":[175],"interaction":[176,197,307],",":[178,246],"be":[181,293],"zero":[182],"(independent,":[183],"no":[184],"interaction),":[185],"positive":[186],"(parallel),":[187],"negative":[189,217],"(serial).Second,":[190],"illustrate":[192],"value":[194],"using":[196],"optimization.":[203],"with":[207,240],"long":[209,221],"pipeline,":[210],"show":[212],"how":[213],"mitigate":[215],"effect":[219],"latency":[222],"\"critical\"":[223],"loops,":[224],"level-one":[228],"access":[230],"issue-wakeup,":[232],"optimizing":[234],"seemingly":[235],"unrelated":[236],"resources":[237],"them.Finally,":[241],"propose":[243],"shotgun":[244],"profiling":[245,251],"class":[248],"infrastructures":[252],"are":[254],"parallelism-aware,":[255],"contrast":[257],"counters.":[261],"Our":[262],"recommended":[263],"requires":[265],"modest":[267],"extensions":[268],"current":[270],"counters,":[272],"while":[273],"enabling":[274],"construction":[276],"full-featured":[278],"dependence":[279,286],"graphs":[280],"microexecution.":[283],"With":[284],"graphs,":[287],"many":[288],"types":[289],"analyses":[291],"performed,":[294],"including":[295],"identifying":[296],"slack,":[300],"well":[302],"computing":[304],"costs.":[308]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":3},{"year":2015,"cited_by_count":2},{"year":2014,"cited_by_count":2},{"year":2012,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
