{"id":"https://openalex.org/W2106840144","doi":"https://doi.org/10.1109/apcsac.2008.4625471","title":"Profile guided optimization for dataflow predication","display_name":"Profile guided optimization for dataflow predication","publication_year":2008,"publication_date":"2008-08-01","ids":{"openalex":"https://openalex.org/W2106840144","doi":"https://doi.org/10.1109/apcsac.2008.4625471","mag":"2106840144"},"language":"en","primary_location":{"id":"doi:10.1109/apcsac.2008.4625471","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apcsac.2008.4625471","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2008 13th Asia-Pacific Computer Systems Architecture Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100382429","display_name":"Wang Li","orcid":"https://orcid.org/0000-0003-1286-4407"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Li Wang","raw_affiliation_strings":["Department of Computer Science and Technology, University of Science and Technology of China, Hefei 230026, China","Department of Computer Science and Technology, University of Science and Technology, Hefei, China","Key Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology of China, Hefei 230026, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Key Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085758579","display_name":"Hong An","orcid":"https://orcid.org/0000-0002-3900-3722"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hong An","raw_affiliation_strings":["Department of Computer Science and Technology, University of Science and Technology of China, Hefei 230026, China","Department of Computer Science and Technology, University of Science and Technology, Hefei, China","Key Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology of China, Hefei 230026, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Key Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012651330","display_name":"Yongqing Ren","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongqing Ren","raw_affiliation_strings":["Department of Computer Science and Technology, University of Science and Technology of China, Hefei 230026, China","Department of Computer Science and Technology, University of Science and Technology, Hefei, China","Key Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology of China, Hefei 230026, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Key Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030366532","display_name":"Yaobin Wang","orcid":"https://orcid.org/0000-0001-9028-7911"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yaobin Wang","raw_affiliation_strings":["Department of Computer Science and Technology, University of Science and Technology of China, Hefei 230026, China","Department of Computer Science and Technology, University of Science and Technology, Hefei, China","Key Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology of China, Hefei 230026, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Key Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China","institution_ids":["https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100382429"],"corresponding_institution_ids":["https://openalex.org/I126520041","https://openalex.org/I19820366"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.09333126,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10142","display_name":"Formal Methods in Verification","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dataflow","display_name":"Dataflow","score":0.9522769451141357},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.8411051630973816},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8242828845977783},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7163273096084595},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.6125357747077942},{"id":"https://openalex.org/keywords/serialization","display_name":"Serialization","score":0.5959743857383728},{"id":"https://openalex.org/keywords/profiling","display_name":"Profiling (computer programming)","score":0.5232036113739014},{"id":"https://openalex.org/keywords/power-consumption","display_name":"Power consumption","score":0.49973320960998535},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.47107046842575073},{"id":"https://openalex.org/keywords/performance-improvement","display_name":"Performance improvement","score":0.45177289843559265},{"id":"https://openalex.org/keywords/dataflow-architecture","display_name":"Dataflow architecture","score":0.41058918833732605},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.24643364548683167},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.22365015745162964}],"concepts":[{"id":"https://openalex.org/C96324660","wikidata":"https://www.wikidata.org/wiki/Q205446","display_name":"Dataflow","level":2,"score":0.9522769451141357},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.8411051630973816},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8242828845977783},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7163273096084595},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.6125357747077942},{"id":"https://openalex.org/C52723943","wikidata":"https://www.wikidata.org/wiki/Q1127410","display_name":"Serialization","level":2,"score":0.5959743857383728},{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.5232036113739014},{"id":"https://openalex.org/C2984118289","wikidata":"https://www.wikidata.org/wiki/Q29954","display_name":"Power consumption","level":3,"score":0.49973320960998535},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.47107046842575073},{"id":"https://openalex.org/C2778915421","wikidata":"https://www.wikidata.org/wiki/Q3643177","display_name":"Performance improvement","level":2,"score":0.45177289843559265},{"id":"https://openalex.org/C176727019","wikidata":"https://www.wikidata.org/wiki/Q1172415","display_name":"Dataflow architecture","level":3,"score":0.41058918833732605},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.24643364548683167},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.22365015745162964},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/apcsac.2008.4625471","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apcsac.2008.4625471","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2008 13th Asia-Pacific Computer Systems Architecture Conference","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6299999952316284,"id":"https://metadata.un.org/sdg/8","display_name":"Decent work and economic growth"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W12207660","https://openalex.org/W2015509025","https://openalex.org/W2084451631","https://openalex.org/W2101134669","https://openalex.org/W2113174625","https://openalex.org/W2116299797","https://openalex.org/W2129192659","https://openalex.org/W2129962996","https://openalex.org/W2134218813","https://openalex.org/W2136882019","https://openalex.org/W2137081678","https://openalex.org/W2140311411","https://openalex.org/W2142422634","https://openalex.org/W2143756982","https://openalex.org/W2147345262","https://openalex.org/W2154332652","https://openalex.org/W2163599246","https://openalex.org/W2163870456","https://openalex.org/W2295946175","https://openalex.org/W2576288252","https://openalex.org/W4236752439","https://openalex.org/W4246413825","https://openalex.org/W4251785457","https://openalex.org/W4253277575","https://openalex.org/W6675115123","https://openalex.org/W6683751876"],"related_works":["https://openalex.org/W2564598376","https://openalex.org/W1484403103","https://openalex.org/W2584408851","https://openalex.org/W2115158825","https://openalex.org/W2101960124","https://openalex.org/W4377693460","https://openalex.org/W2033683327","https://openalex.org/W2783505431","https://openalex.org/W2187181201","https://openalex.org/W2521947294"],"abstract_inverted_index":{"Dataflow":[0],"predication":[1],"provides":[2],"a":[3,73],"lightweight":[4],"full":[5],"support":[6],"for":[7,25],"predicated":[8],"execution":[9],"in":[10,89,129,148],"dataflow-like":[11],"architectures.":[12],"One":[13],"of":[14,22,41],"its":[15],"major":[16],"overhead":[17],"is":[18,60],"the":[19,37,87,94],"large":[20],"amounts":[21],"fanout":[23,131],"trees":[24],"distributing":[26],"predicates":[27],"to":[28,51,77,85,91],"all":[29],"dependant":[30],"instructions.":[31],"Conventional":[32],"optimizations":[33],"are":[34],"predicating":[35,99,105,139,146],"only":[36],"heads":[38,59,106,140],"or":[39,96],"tails":[40,45,100,147],"dataflow":[42],"chains.":[43],"Predicating":[44,58],"offers":[46],"more":[47],"speculation":[48,65],"but":[49,63],"leads":[50],"resource":[52,117],"contentions":[53],"and":[54,66,104,116,141],"power":[55,61,115],"consumption":[56],"increasing.":[57],"efficient":[62],"reduces":[64],"instruction":[67],"level":[68],"parallelism.":[69],"This":[70],"paper":[71],"introduces":[72],"profile":[74,124],"guided":[75,125],"technique":[76,111],"combine":[78],"these":[79],"optimizations.":[80],"It":[81,133],"uses":[82],"profiling":[83],"feedback":[84],"guide":[86],"compiler":[88],"deciding":[90],"predicate":[92],"at":[93],"head":[95],"tail.":[97],"By":[98],"on":[101,107],"hot":[102],"paths":[103],"infrequent":[108],"paths,":[109],"this":[110],"can":[112],"get":[113],"performance,":[114],"efficiency.":[118],"Performance":[119],"evaluation":[120],"result":[121],"shows":[122],"that":[123],"optimization":[126],"performs":[127],"better":[128],"removing":[130],"trees.":[132],"has":[134],"10.6%":[135],"speedup":[136,143],"over":[137,144],"always":[138,145],"2.5%":[142],"performance.":[149]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
