{"id":"https://openalex.org/W2106840144","doi":"https://doi.org/10.1109/apcsac.2008.4625471","title":"Profile guided optimization for dataflow predication","display_name":"Profile guided optimization for dataflow predication","publication_year":2008,"publication_date":"2008-08-01","ids":{"openalex":"https://openalex.org/W2106840144","doi":"https://doi.org/10.1109/apcsac.2008.4625471","mag":"2106840144"},"language":"en","primary_location":{"id":"doi:10.1109/apcsac.2008.4625471","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apcsac.2008.4625471","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2008 13th Asia-Pacific Computer Systems Architecture Conference","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100382429","display_name":"Wang Li","orcid":"https://orcid.org/0000-0003-1286-4407"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Li Wang","raw_affiliation_strings":["Department of Computer Science and Technology, University of Science and Technology of China, Hefei 230026, China","Key Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China","Department of Computer Science and Technology, University of Science and Technology, Hefei, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology of China, Hefei 230026, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Key Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China","institution_ids":["https://openalex.org/I19820366"]},{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085758579","display_name":"Hong An","orcid":"https://orcid.org/0000-0002-3900-3722"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hong An","raw_affiliation_strings":["Department of Computer Science and Technology, University of Science and Technology of China, Hefei 230026, China","Key Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China","Department of Computer Science and Technology, University of Science and Technology, Hefei, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology of China, Hefei 230026, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Key Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China","institution_ids":["https://openalex.org/I19820366"]},{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012651330","display_name":"Yongqing Ren","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongqing Ren","raw_affiliation_strings":["Department of Computer Science and Technology, University of Science and Technology of China, Hefei 230026, China","Department of Computer Science and Technology, University of Science and Technology, Hefei, China","Key Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology of China, Hefei 230026, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Key Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030366532","display_name":"Yaobin Wang","orcid":"https://orcid.org/0000-0001-9028-7911"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yaobin Wang","raw_affiliation_strings":["Department of Computer Science and Technology, University of Science and Technology of China, Hefei 230026, China","Key Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China","Department of Computer Science and Technology, University of Science and Technology, Hefei, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology of China, Hefei 230026, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Key Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China","institution_ids":["https://openalex.org/I19820366"]},{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.09752965,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10142","display_name":"Formal Methods in Verification","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dataflow","display_name":"Dataflow","score":0.9522769451141357},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.8411051630973816},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8242828845977783},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7163273096084595},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.6125357747077942},{"id":"https://openalex.org/keywords/serialization","display_name":"Serialization","score":0.5959743857383728},{"id":"https://openalex.org/keywords/profiling","display_name":"Profiling (computer programming)","score":0.5232036113739014},{"id":"https://openalex.org/keywords/power-consumption","display_name":"Power consumption","score":0.49973320960998535},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.47107046842575073},{"id":"https://openalex.org/keywords/performance-improvement","display_name":"Performance improvement","score":0.45177289843559265},{"id":"https://openalex.org/keywords/dataflow-architecture","display_name":"Dataflow architecture","score":0.41058918833732605},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.24643364548683167},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.22365015745162964}],"concepts":[{"id":"https://openalex.org/C96324660","wikidata":"https://www.wikidata.org/wiki/Q205446","display_name":"Dataflow","level":2,"score":0.9522769451141357},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.8411051630973816},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8242828845977783},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7163273096084595},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.6125357747077942},{"id":"https://openalex.org/C52723943","wikidata":"https://www.wikidata.org/wiki/Q1127410","display_name":"Serialization","level":2,"score":0.5959743857383728},{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.5232036113739014},{"id":"https://openalex.org/C2984118289","wikidata":"https://www.wikidata.org/wiki/Q29954","display_name":"Power consumption","level":3,"score":0.49973320960998535},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.47107046842575073},{"id":"https://openalex.org/C2778915421","wikidata":"https://www.wikidata.org/wiki/Q3643177","display_name":"Performance improvement","level":2,"score":0.45177289843559265},{"id":"https://openalex.org/C176727019","wikidata":"https://www.wikidata.org/wiki/Q1172415","display_name":"Dataflow architecture","level":3,"score":0.41058918833732605},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.24643364548683167},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.22365015745162964},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/apcsac.2008.4625471","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apcsac.2008.4625471","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2008 13th Asia-Pacific Computer Systems Architecture Conference","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Decent work and economic growth","score":0.6299999952316284,"id":"https://metadata.un.org/sdg/8"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W12207660","https://openalex.org/W2015509025","https://openalex.org/W2084451631","https://openalex.org/W2101134669","https://openalex.org/W2113174625","https://openalex.org/W2116299797","https://openalex.org/W2129192659","https://openalex.org/W2129962996","https://openalex.org/W2134218813","https://openalex.org/W2136882019","https://openalex.org/W2137081678","https://openalex.org/W2140311411","https://openalex.org/W2142422634","https://openalex.org/W2143756982","https://openalex.org/W2147345262","https://openalex.org/W2154332652","https://openalex.org/W2163599246","https://openalex.org/W2163870456","https://openalex.org/W2295946175","https://openalex.org/W2576288252","https://openalex.org/W4236752439","https://openalex.org/W4246413825","https://openalex.org/W4251785457","https://openalex.org/W4253277575","https://openalex.org/W6675115123","https://openalex.org/W6683751876"],"related_works":["https://openalex.org/W2564598376","https://openalex.org/W1484403103","https://openalex.org/W2584408851","https://openalex.org/W2115158825","https://openalex.org/W2101960124","https://openalex.org/W4377693460","https://openalex.org/W2033683327","https://openalex.org/W2783505431","https://openalex.org/W2187181201","https://openalex.org/W2521947294"],"abstract_inverted_index":{"Dataflow":[0],"predication":[1],"provides":[2],"a":[3,73],"lightweight":[4],"full":[5],"support":[6],"for":[7,25],"predicated":[8],"execution":[9],"in":[10,89,129,148],"dataflow-like":[11],"architectures.":[12],"One":[13],"of":[14,22,41],"its":[15],"major":[16],"overhead":[17],"is":[18,60],"the":[19,37,87,94],"large":[20],"amounts":[21],"fanout":[23,131],"trees":[24],"distributing":[26],"predicates":[27],"to":[28,51,77,85,91],"all":[29],"dependant":[30],"instructions.":[31],"Conventional":[32],"optimizations":[33],"are":[34],"predicating":[35,99,105,139,146],"only":[36],"heads":[38,59,106,140],"or":[39,96],"tails":[40,45,100,147],"dataflow":[42],"chains.":[43],"Predicating":[44,58],"offers":[46],"more":[47],"speculation":[48,65],"but":[49,63],"leads":[50],"resource":[52,117],"contentions":[53],"and":[54,66,104,116,141],"power":[55,61,115],"consumption":[56],"increasing.":[57],"efficient":[62],"reduces":[64],"instruction":[67],"level":[68],"parallelism.":[69],"This":[70],"paper":[71],"introduces":[72],"profile":[74,124],"guided":[75,125],"technique":[76,111],"combine":[78],"these":[79],"optimizations.":[80],"It":[81,133],"uses":[82],"profiling":[83],"feedback":[84],"guide":[86],"compiler":[88],"deciding":[90],"predicate":[92],"at":[93],"head":[95],"tail.":[97],"By":[98],"on":[101,107],"hot":[102],"paths":[103],"infrequent":[108],"paths,":[109],"this":[110],"can":[112],"get":[113],"performance,":[114],"efficiency.":[118],"Performance":[119],"evaluation":[120],"result":[121],"shows":[122],"that":[123],"optimization":[126],"performs":[127],"better":[128],"removing":[130],"trees.":[132],"has":[134],"10.6%":[135],"speedup":[136,143],"over":[137,144],"always":[138,145],"2.5%":[142],"performance.":[149]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
