{"id":"https://openalex.org/W4410321819","doi":"https://doi.org/10.1145/3725798.3725807","title":"Efficient Parallel Implementation of Non-Local Means Algorithm on GPU","display_name":"Efficient Parallel Implementation of Non-Local Means Algorithm on GPU","publication_year":2025,"publication_date":"2025-03-01","ids":{"openalex":"https://openalex.org/W4410321819","doi":"https://doi.org/10.1145/3725798.3725807"},"language":"en","primary_location":{"id":"doi:10.1145/3725798.3725807","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3725798.3725807","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3725798.3725807","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 17th Workshop on General Purpose Processing Using GPU","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3725798.3725807","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100636346","display_name":"Xiang Li","orcid":"https://orcid.org/0000-0001-6933-6491"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xiang Li","raw_affiliation_strings":["Nanjing university, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Nanjing university, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011965834","display_name":"Qiong Chang","orcid":"https://orcid.org/0000-0002-4447-0480"},"institutions":[{"id":"https://openalex.org/I4400009020","display_name":"Institute of Science Tokyo","ror":"https://ror.org/05dqf9946","country_code":null,"type":"education","lineage":["https://openalex.org/I4400009020"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Qiong Chang","raw_affiliation_strings":["Institute of Science Tokyo, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Institute of Science Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I4400009020"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100395668","display_name":"Yun Li","orcid":"https://orcid.org/0000-0003-1753-7317"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yun Li","raw_affiliation_strings":["Nanjing university, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Nanjing university, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5026559426","display_name":"Jun Miyazaki","orcid":"https://orcid.org/0000-0002-3038-7678"},"institutions":[{"id":"https://openalex.org/I4400009020","display_name":"Institute of Science Tokyo","ror":"https://ror.org/05dqf9946","country_code":null,"type":"education","lineage":["https://openalex.org/I4400009020"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Jun Miyazaki","raw_affiliation_strings":["Institute of Science Tokyo, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Institute of Science Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I4400009020"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100636346"],"corresponding_institution_ids":["https://openalex.org/I881766915"],"apc_list":null,"apc_paid":null,"fwci":2.7712,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.90099438,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"55","last_page":"61"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10688","display_name":"Image and Signal Denoising Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10688","display_name":"Image and Signal Denoising Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10500","display_name":"Sparse and Compressive Sensing Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8051694631576538},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7136774063110352},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.45835721492767334},{"id":"https://openalex.org/keywords/parallel-algorithm","display_name":"Parallel algorithm","score":0.42146438360214233},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3844663202762604}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8051694631576538},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7136774063110352},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.45835721492767334},{"id":"https://openalex.org/C120373497","wikidata":"https://www.wikidata.org/wiki/Q1087987","display_name":"Parallel algorithm","level":2,"score":0.42146438360214233},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3844663202762604}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3725798.3725807","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3725798.3725807","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3725798.3725807","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 17th Workshop on General Purpose Processing Using GPU","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3725798.3725807","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3725798.3725807","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3725798.3725807","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 17th Workshop on General Purpose Processing Using GPU","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1069223013","display_name":null,"funder_award_id":"JSPS KAKENHI","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G1976657664","display_name":null,"funder_award_id":"23K28091","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G3459562248","display_name":null,"funder_award_id":"Grant","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G4636223006","display_name":null,"funder_award_id":"JSPS KAK","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"},{"id":"https://openalex.org/G8430481527","display_name":null,"funder_award_id":"Number","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"}],"funders":[{"id":"https://openalex.org/F4320334764","display_name":"Japan Society for the Promotion of Science","ror":"https://ror.org/00hhkn466"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4410321819.pdf","grobid_xml":"https://content.openalex.org/works/W4410321819.grobid-xml"},"referenced_works_count":26,"referenced_works":["https://openalex.org/W2097073572","https://openalex.org/W2137901785","https://openalex.org/W2142592339","https://openalex.org/W2267520283","https://openalex.org/W2339758283","https://openalex.org/W2405535704","https://openalex.org/W2793775504","https://openalex.org/W2956015785","https://openalex.org/W2963091558","https://openalex.org/W2972158684","https://openalex.org/W2981899103","https://openalex.org/W3004947139","https://openalex.org/W3013302728","https://openalex.org/W3035006120","https://openalex.org/W3047011367","https://openalex.org/W3104467360","https://openalex.org/W3116606340","https://openalex.org/W3134030220","https://openalex.org/W3159911942","https://openalex.org/W3166036439","https://openalex.org/W4205102828","https://openalex.org/W4285697865","https://openalex.org/W4328053402","https://openalex.org/W4378573650","https://openalex.org/W4390317766","https://openalex.org/W4401818004"],"related_works":["https://openalex.org/W2005148983","https://openalex.org/W2012954338","https://openalex.org/W2096672917","https://openalex.org/W2392023973","https://openalex.org/W2032508741","https://openalex.org/W2363538625","https://openalex.org/W2070865675","https://openalex.org/W4297775710","https://openalex.org/W2071635571","https://openalex.org/W4212854884"],"abstract_inverted_index":{"The":[0],"Non-Local":[1],"Means":[2],"(NLM)":[3],"algorithm":[4,56],"has":[5,25],"become":[6],"a":[7,112,152],"crucial":[8],"preprocessing":[9],"technique":[10],"for":[11,91,108],"image":[12,155],"processing":[13],"due":[14],"to":[15,28,71,84,100,123,136],"its":[16,58],"effectiveness":[17],"in":[18,32,88],"denoising":[19],"while":[20],"preserving":[21],"fine":[22],"details.This":[23],"method":[24],"been":[26],"proven":[27],"be":[29],"highly":[30],"efficient":[31,67],"high-demand":[33],"tasks":[34],"within":[35],"industrial":[36],"applications":[37],"such":[38],"as":[39,120],"medical":[40],"imaging":[41],"and":[42,48,75,125],"remote":[43],"sensing.However,":[44],"the":[45,54,95,147],"computation":[46,103],"intensive":[47,51],"memory":[49,76,119],"access":[50],"characteristics":[52],"of":[53,144,154],"NLM":[55],"hinder":[57],"real-time":[59],"applications.To":[60],"address":[61],"this":[62],"issue,":[63],"we":[64,93,110],"propose":[65],"an":[66,121,141],"GPU":[68,117],"parallel":[69],"kernel":[70,78,139],"minimize":[72],"redundant":[73,86],"computations":[74,87],"accesses.The":[77],"integrates":[79],"two":[80,89],"nested":[81],"reuse":[82,101,126],"strategies":[83],"handle":[85],"dimensions:":[90],"columns,":[92],"leverage":[94],"fast":[96],"data":[97],"exchange":[98],"mechanism":[99],"column":[102],"results":[104,132],"via":[105],"on-chip":[106],"registers;":[107],"rows,":[109],"use":[111],"sliding":[113],"window":[114],"strategy,":[115],"utilizing":[116],"global":[118],"intermediary":[122],"store":[124],"similarity":[127],"values":[128],"between":[129],"filtered":[130],"rows.Experimental":[131],"demonstrate":[133],"that,":[134],"compared":[135],"OpenCV,":[137],"our":[138],"achieves":[140],"average":[142],"speedup":[143],"4.5x":[145],"on":[146],"RTX":[148],"3080":[149],"platform":[150],"across":[151],"range":[153],"data,":[156],"showcasing":[157],"exceptional":[158],"performance.":[159],"CCS":[160],"Concepts":[161]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-03-12T08:34:05.389933","created_date":"2025-10-10T00:00:00"}
