{"id":"https://openalex.org/W2537178584","doi":"https://doi.org/10.1109/dsaa.2014.7058100","title":"General in-situ matrix transposition algorithm for massively parallel environments","display_name":"General in-situ matrix transposition algorithm for massively parallel environments","publication_year":2014,"publication_date":"2014-10-01","ids":{"openalex":"https://openalex.org/W2537178584","doi":"https://doi.org/10.1109/dsaa.2014.7058100","mag":"2537178584"},"language":"en","primary_location":{"id":"doi:10.1109/dsaa.2014.7058100","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dsaa.2014.7058100","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 International Conference on Data Science and Advanced Analytics (DSAA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5105764461","display_name":"Marcin Gorawski","orcid":"https://orcid.org/0000-0003-4528-242X"},"institutions":[{"id":"https://openalex.org/I119004910","display_name":"Silesian University of Technology","ror":"https://ror.org/02dyjk442","country_code":"PL","type":"education","lineage":["https://openalex.org/I119004910"]}],"countries":["PL"],"is_corresponding":true,"raw_author_name":"Marcin Gorawski","raw_affiliation_strings":["Politechnika Slaska, Gliwice, PL"],"affiliations":[{"raw_affiliation_string":"Politechnika Slaska, Gliwice, PL","institution_ids":["https://openalex.org/I119004910"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5058061541","display_name":"Michal Lorek","orcid":null},"institutions":[{"id":"https://openalex.org/I4210087266","display_name":"Institute of Computer Science","ror":"https://ror.org/003fvp964","country_code":"PL","type":"facility","lineage":["https://openalex.org/I4210087266","https://openalex.org/I99542240"]},{"id":"https://openalex.org/I119004910","display_name":"Silesian University of Technology","ror":"https://ror.org/02dyjk442","country_code":"PL","type":"education","lineage":["https://openalex.org/I119004910"]}],"countries":["PL"],"is_corresponding":false,"raw_author_name":"Michal Lorek","raw_affiliation_strings":["Institute of Computer Science, Silesian University of Technology, Gliwice, Poland"],"affiliations":[{"raw_affiliation_string":"Institute of Computer Science, Silesian University of Technology, Gliwice, Poland","institution_ids":["https://openalex.org/I119004910","https://openalex.org/I4210087266"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5105764461"],"corresponding_institution_ids":["https://openalex.org/I119004910"],"apc_list":null,"apc_paid":null,"fwci":0.3065,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.64271776,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"8","issue":null,"first_page":"379","last_page":"384"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/transpose","display_name":"Transpose","score":0.8711177110671997},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7634603381156921},{"id":"https://openalex.org/keywords/massively-parallel","display_name":"Massively parallel","score":0.7630766034126282},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.7502948641777039},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6721234321594238},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.6622469425201416},{"id":"https://openalex.org/keywords/transposition","display_name":"Transposition (logic)","score":0.5431361198425293},{"id":"https://openalex.org/keywords/grid","display_name":"Grid","score":0.5052555203437805},{"id":"https://openalex.org/keywords/diagonal","display_name":"Diagonal","score":0.5001533031463623},{"id":"https://openalex.org/keywords/matrix","display_name":"Matrix (chemical analysis)","score":0.4839230179786682},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.48059889674186707},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.43099892139434814},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3856112062931061},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1710158884525299},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.12048473954200745}],"concepts":[{"id":"https://openalex.org/C200106649","wikidata":"https://www.wikidata.org/wiki/Q223683","display_name":"Transpose","level":3,"score":0.8711177110671997},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7634603381156921},{"id":"https://openalex.org/C190475519","wikidata":"https://www.wikidata.org/wiki/Q544384","display_name":"Massively parallel","level":2,"score":0.7630766034126282},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.7502948641777039},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6721234321594238},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.6622469425201416},{"id":"https://openalex.org/C12455157","wikidata":"https://www.wikidata.org/wiki/Q7835331","display_name":"Transposition (logic)","level":2,"score":0.5431361198425293},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.5052555203437805},{"id":"https://openalex.org/C130367717","wikidata":"https://www.wikidata.org/wiki/Q189791","display_name":"Diagonal","level":2,"score":0.5001533031463623},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.4839230179786682},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.48059889674186707},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.43099892139434814},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3856112062931061},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1710158884525299},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.12048473954200745},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/dsaa.2014.7058100","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dsaa.2014.7058100","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2014 International Conference on Data Science and Advanced Analytics (DSAA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W1483568252","https://openalex.org/W2026418698","https://openalex.org/W2036895269","https://openalex.org/W2043106819","https://openalex.org/W2061989483","https://openalex.org/W2092139011","https://openalex.org/W2092156305","https://openalex.org/W2102200144","https://openalex.org/W2111309482","https://openalex.org/W2117148224","https://openalex.org/W2123040349","https://openalex.org/W2129541371","https://openalex.org/W2139801399","https://openalex.org/W2294832214","https://openalex.org/W2764433274","https://openalex.org/W2798909945","https://openalex.org/W3157789364","https://openalex.org/W3213084269","https://openalex.org/W6678356664","https://openalex.org/W6750968397","https://openalex.org/W7048190923"],"related_works":["https://openalex.org/W2099244661","https://openalex.org/W2003786218","https://openalex.org/W3062287","https://openalex.org/W2097753256","https://openalex.org/W4313549635","https://openalex.org/W2380390332","https://openalex.org/W2376104713","https://openalex.org/W2083746907","https://openalex.org/W2183938881","https://openalex.org/W2176617845"],"abstract_inverted_index":{"Matrix":[0],"transposition":[1,26],"is":[2,62],"an":[3],"essential":[4],"mathematical":[5],"operation":[6],"broadly":[7],"used":[8,52],"in":[9,28,70],"many":[10],"scientific":[11],"and":[12,55,136,146],"engineering":[13],"domains.":[14],"In":[15,59,115],"this":[16],"paper,":[17],"we":[18,81,117,128],"present":[19,118],"a":[20,45,66,72,119],"new":[21],"approach":[22],"to":[23,35,39,53,64,111],"the":[24,101,144],"matrix":[25,57,98],"problem":[27],"massively":[29],"parallel":[30],"computing":[31],"environments.":[32],"We":[33],"propose":[34],"utilize":[36],"recursive":[37],"functions":[38,88],"translate":[40],"worker":[41],"(thread)":[42],"coordinates":[43],"on":[44,76,134],"grid":[46,67],"so":[47,89],"that":[48,90],"they":[49],"can":[50,82,94,108],"be":[51,109],"locate":[54],"transpose":[56],"elements.":[58],"principal,":[60],"it":[61,84],"possible":[63],"define":[65],"of":[68,122,143],"threads":[69],"such":[71],"way":[73],"that,":[74],"based":[75],"their":[77],"uniquely":[78],"assigned":[79],"index,":[80],"decompose":[83],"using":[85],"above":[86],"mentioned":[87],"each":[91],"individual":[92],"thread":[93],"exchange":[95],"two":[96],"relevant":[97],"elements":[99],"across":[100],"main":[102],"diagonal.":[103],"Currently,":[104],"our":[105,123,138],"in-place":[106,145],"method":[107],"applied":[110],"arbitrary":[112],"square":[113],"matrices.":[114],"addition,":[116],"basic":[120],"implementation":[121],"algorithm":[124],"for":[125,149],"CUDA.":[126,150],"Finally,":[127],"demonstrate":[129],"initial":[130],"performance":[131],"tests":[132],"performed":[133],"GPU":[135],"compare":[137],"results":[139],"with":[140],"naive":[141],"versions":[142],"out-of-place":[147],"algorithms":[148]},"counts_by_year":[{"year":2017,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
