{"id":"https://openalex.org/W2157203968","doi":"https://doi.org/10.1109/ipdps.2004.1302943","title":"Host-assisted zero-copy remote memory access communication on InfiniBand","display_name":"Host-assisted zero-copy remote memory access communication on InfiniBand","publication_year":2004,"publication_date":"2004-06-10","ids":{"openalex":"https://openalex.org/W2157203968","doi":"https://doi.org/10.1109/ipdps.2004.1302943","mag":"2157203968"},"language":"en","primary_location":{"id":"doi:10.1109/ipdps.2004.1302943","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ipdps.2004.1302943","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"18th International Parallel and Distributed Processing Symposium, 2004. Proceedings.","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004260847","display_name":"Vinod Tipparaju","orcid":null},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"V. Tipparaju","raw_affiliation_strings":["Pacific Northwest National Laboratory, USA"],"affiliations":[{"raw_affiliation_string":"Pacific Northwest National Laboratory, USA","institution_ids":["https://openalex.org/I142606810"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110262125","display_name":"Gopalakrishnan Santhanaraman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"G. Santhanaraman","raw_affiliation_strings":["Ohio State Uinversity, USA"],"affiliations":[{"raw_affiliation_string":"Ohio State Uinversity, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010719257","display_name":"Jaroslaw Nieplocha","orcid":null},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"J. Nieplocha","raw_affiliation_strings":["Pacific Northwest National Laboratory, USA"],"affiliations":[{"raw_affiliation_string":"Pacific Northwest National Laboratory, USA","institution_ids":["https://openalex.org/I142606810"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024879682","display_name":"Dhabaleswar K. Panda","orcid":"https://orcid.org/0000-0002-0356-1781"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"D.K. Panda","raw_affiliation_strings":["Ohio State Uinversity, USA"],"affiliations":[{"raw_affiliation_string":"Ohio State Uinversity, USA","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5004260847"],"corresponding_institution_ids":["https://openalex.org/I142606810"],"apc_list":null,"apc_paid":null,"fwci":5.8218,"has_fulltext":false,"cited_by_count":45,"citation_normalized_percentile":{"value":0.96494014,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"31","last_page":"40"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/infiniband","display_name":"InfiniBand","score":0.9881051778793335},{"id":"https://openalex.org/keywords/remote-direct-memory-access","display_name":"Remote direct memory access","score":0.9280303716659546},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8496769666671753},{"id":"https://openalex.org/keywords/host","display_name":"Host (biology)","score":0.7333412766456604},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.5959934592247009},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.49925971031188965},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4838804006576538},{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.48017969727516174},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.37079572677612305},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.33724021911621094},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.11136487126350403},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.09170347452163696}],"concepts":[{"id":"https://openalex.org/C2781030343","wikidata":"https://www.wikidata.org/wiki/Q922437","display_name":"InfiniBand","level":2,"score":0.9881051778793335},{"id":"https://openalex.org/C130795937","wikidata":"https://www.wikidata.org/wiki/Q2561570","display_name":"Remote direct memory access","level":2,"score":0.9280303716659546},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8496769666671753},{"id":"https://openalex.org/C126831891","wikidata":"https://www.wikidata.org/wiki/Q221673","display_name":"Host (biology)","level":2,"score":0.7333412766456604},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.5959934592247009},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.49925971031188965},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4838804006576538},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.48017969727516174},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.37079572677612305},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.33724021911621094},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.11136487126350403},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.09170347452163696},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/ipdps.2004.1302943","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ipdps.2004.1302943","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"18th International Parallel and Distributed Processing Symposium, 2004. Proceedings.","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.59.5927","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.59.5927","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.emsl.pnl.gov/docs/parsoft/armci/publications/hostassisted.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.6.3417","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.6.3417","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://nowlab.cis.ohio-state.edu/projects/mpi-iba/./publication/ipdps04hostassistediba.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320332359","display_name":"Office of Science","ror":"https://ror.org/00mmn6b08"},{"id":"https://openalex.org/F4320337506","display_name":"Advanced Scientific Computing Research","ror":"https://ror.org/0012c7r22"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W74523810","https://openalex.org/W1484892604","https://openalex.org/W1580435966","https://openalex.org/W1751637436","https://openalex.org/W1861151562","https://openalex.org/W1951864593","https://openalex.org/W2056999868","https://openalex.org/W2069079195","https://openalex.org/W2112121929","https://openalex.org/W2135342109","https://openalex.org/W2140300123","https://openalex.org/W2149970695","https://openalex.org/W2152719989","https://openalex.org/W2199463396","https://openalex.org/W2541014599","https://openalex.org/W2903691225","https://openalex.org/W2920177565","https://openalex.org/W4241489583","https://openalex.org/W4248885950","https://openalex.org/W4285719527","https://openalex.org/W6628811474","https://openalex.org/W6631615826","https://openalex.org/W6637644149","https://openalex.org/W6639223761","https://openalex.org/W6728663354"],"related_works":["https://openalex.org/W1978254186","https://openalex.org/W4245217724","https://openalex.org/W4390917331","https://openalex.org/W1984788566","https://openalex.org/W4253931064","https://openalex.org/W3166154920","https://openalex.org/W2154082760","https://openalex.org/W1964981582","https://openalex.org/W4282599985","https://openalex.org/W2139382794"],"abstract_inverted_index":{"Summary":[0],"form":[1],"only":[2],"given.":[3],"The":[4,62,228],"remote":[5],"memory":[6],"access":[7],"(RMA)":[8],"is":[9],"an":[10,87],"increasingly":[11],"important":[12],"communication":[13,22,84],"model":[14],"due":[15,181],"to":[16,100,161,177,182,191,216,237],"its":[17],"excellent":[18,88,245],"potential":[19],"for":[20,116,133,163,212,218],"overlapping":[21],"and":[23,25,85,109,118,126,208,214,231,243],"computations":[24],"achieving":[26,82],"high":[27,202],"performance":[28,143],"on":[29],"modern":[30],"networks":[31],"with":[32,92],"RDMA":[33],"hardware":[34],"such":[35],"as":[36,139,141,189],"Infiniband.":[37],"RMA":[38,55],"plays":[39],"a":[40,102,110,119,127,200],"vital":[41],"role":[42],"in":[43,186,220],"supporting":[44,86],"the":[45,68,77,142,145,150,153,164,170,192],"emerging":[46],"global":[47],"address":[48],"space":[49],"programming":[50],"models.":[51],"We":[52,167],"describe":[53],"how":[54],"can":[56,72,157],"be":[57,73],"implemented":[58,74],"efficiently":[59,75],"over":[60],"InfiniBand.":[61],"capabilities":[63],"not":[64],"offered":[65],"directly":[66],"by":[67],"Infiniband":[69],"verb":[70],"layer":[71],"using":[76],"novel":[78],"host-assisted":[79,174],"approach":[80,156,188],"while":[81],"zero-copy":[83],"overlap":[89,205,211],"of":[90,106,113,123,130,144,173,204,206,222,240],"computation":[91,207],"communication.":[93,209],"For":[94,149],"contiguous":[95,165,213],"data":[96],"we":[97],"are":[98,137],"able":[99],"achieve":[101],"small":[103,120],"message":[104,121,224],"latency":[105,122],"6/spl":[107],"mu/s":[108,125],"peak":[111,128],"bandwidth":[112,129,159],"830":[114],"MB/s":[115],"'put'":[117],"12/spl":[124],"765":[131],"Megabytes":[132],"'get'.":[134],"These":[135],"numbers":[136],"almost":[138],"good":[140],"native":[146],"VAPI":[147],"layer.":[148],"noncontiguous":[151,219],"data,":[152],"host":[154,184],"assisted":[155],"deliver":[158],"close":[160],"that":[162],"data.":[166],"also":[168,198],"demonstrate":[169],"superior":[171],"tolerance":[172],"data-transfer":[175],"operations":[176],"CPU":[178],"intensive":[179],"tasks":[180],"minimum":[183],"involvement":[185],"our":[187,241],"compared":[190],"traditional":[193],"host-based":[194],"approach.":[195],"Our":[196],"implementation":[197],"supports":[199],"very":[201],"degree":[203],"99%":[210],"up":[215],"95%":[217],"case":[221],"large":[223],"sizes":[225],"were":[226,235],"achieved.":[227],"NAS":[229],"MG":[230],"matrix":[232],"multiplication":[233],"benchmarks":[234],"used":[236],"validate":[238],"effectiveness":[239],"approach,":[242],"demonstrated":[244],"overall":[246],"performance.":[247]},"counts_by_year":[{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":2}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
