{"id":"https://openalex.org/W2252549844","doi":"https://doi.org/10.1007/978-1-4419-6935-4_20","title":"Autotuning and Specialization: Speeding up Matrix Multiply for Small Matrices with Compiler Technology","display_name":"Autotuning and Specialization: Speeding up Matrix Multiply for Small Matrices with Compiler Technology","publication_year":2010,"publication_date":"2010-08-13","ids":{"openalex":"https://openalex.org/W2252549844","doi":"https://doi.org/10.1007/978-1-4419-6935-4_20","mag":"2252549844"},"language":"en","primary_location":{"id":"doi:10.1007/978-1-4419-6935-4_20","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-1-4419-6935-4_20","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Software Automatic Tuning","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023732376","display_name":"Jaewook Shin","orcid":"https://orcid.org/0000-0002-0342-1834"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Jaewook Shin","raw_affiliation_strings":["Mathematics and Computer Science Division, Argonne National Laboratory, Argonne, IL, 60439, USA"],"affiliations":[{"raw_affiliation_string":"Mathematics and Computer Science Division, Argonne National Laboratory, Argonne, IL, 60439, USA","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030152493","display_name":"Mary Hall","orcid":"https://orcid.org/0000-0002-3058-7573"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mary W. Hall","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057351225","display_name":"Jacqueline Chame","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jacqueline Chame","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103956520","display_name":"Chun Chen","orcid":"https://orcid.org/0009-0005-8416-9587"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chun Chen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5067040957","display_name":"Paul Hovland","orcid":"https://orcid.org/0000-0002-0907-2567"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Paul D. Hovland","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5023732376"],"corresponding_institution_ids":["https://openalex.org/I1282105669"],"apc_list":null,"apc_paid":null,"fwci":3.3288,"has_fulltext":false,"cited_by_count":21,"citation_normalized_percentile":{"value":0.9256651,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"353","last_page":"370"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.9909999966621399,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.988099992275238,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8240360021591187},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.8230827450752258},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6195434331893921},{"id":"https://openalex.org/keywords/implementation","display_name":"Implementation","score":0.4901178777217865},{"id":"https://openalex.org/keywords/heuristics","display_name":"Heuristics","score":0.4785500168800354},{"id":"https://openalex.org/keywords/program-optimization","display_name":"Program optimization","score":0.45822039246559143},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.4385259449481964},{"id":"https://openalex.org/keywords/optimizing-compiler","display_name":"Optimizing compiler","score":0.4325544238090515},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4205150008201599},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.41961869597435},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4161491096019745},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.39428114891052246},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.1156783401966095}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8240360021591187},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.8230827450752258},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6195434331893921},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.4901178777217865},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.4785500168800354},{"id":"https://openalex.org/C139571649","wikidata":"https://www.wikidata.org/wiki/Q1156793","display_name":"Program optimization","level":3,"score":0.45822039246559143},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.4385259449481964},{"id":"https://openalex.org/C190902152","wikidata":"https://www.wikidata.org/wiki/Q1325106","display_name":"Optimizing compiler","level":3,"score":0.4325544238090515},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4205150008201599},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.41961869597435},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4161491096019745},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.39428114891052246},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.1156783401966095}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1007/978-1-4419-6935-4_20","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-1-4419-6935-4_20","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Software Automatic Tuning","raw_type":"book-chapter"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.155.3869","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.155.3869","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www-unix.mcs.anl.gov/~jaewook/papers/iwapt09.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.489.2143","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.489.2143","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.mcs.anl.gov/uploads/cels/papers/P1664.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W243738321","https://openalex.org/W1580643653","https://openalex.org/W1604252617","https://openalex.org/W1631114303","https://openalex.org/W1779740778","https://openalex.org/W1972209410","https://openalex.org/W2007451249","https://openalex.org/W2047656763","https://openalex.org/W2064823029","https://openalex.org/W2099059741","https://openalex.org/W2099625934","https://openalex.org/W2104736438","https://openalex.org/W2107404972","https://openalex.org/W2112502633","https://openalex.org/W2119691711","https://openalex.org/W2121546953","https://openalex.org/W2135653967","https://openalex.org/W2136952590","https://openalex.org/W2158626113","https://openalex.org/W2159756807","https://openalex.org/W2314944927","https://openalex.org/W3136479147","https://openalex.org/W4230521896"],"related_works":["https://openalex.org/W2778498407","https://openalex.org/W2577630842","https://openalex.org/W2113798250","https://openalex.org/W1488300410","https://openalex.org/W4320560513","https://openalex.org/W4225492247","https://openalex.org/W2069117531","https://openalex.org/W2083681681","https://openalex.org/W2956382393","https://openalex.org/W1877657449"],"abstract_inverted_index":null,"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":3},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":2}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
