{"id":"https://openalex.org/W3101819589","doi":"https://doi.org/10.13016/egom-sbxg","title":"Study of Fine-Grained, Irregular Parallel Applications on a Many-Core Processor","display_name":"Study of Fine-Grained, Irregular Parallel Applications on a Many-Core Processor","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3101819589","doi":"https://doi.org/10.13016/egom-sbxg","mag":"3101819589"},"language":"en","primary_location":{"id":"mag:3101819589","is_oa":false,"landing_page_url":"https://drum.lib.umd.edu/handle/1903/26626","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":null},"type":"dissertation","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.13016/egom-sbxg","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041185964","display_name":"James Edwards","orcid":"https://orcid.org/0000-0001-6958-5367"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Edwards, James Alexander","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5041185964"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9747999906539917,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9528999924659729,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.655536949634552},{"id":"https://openalex.org/keywords/many-core","display_name":"Many core","score":0.6286253929138184},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6088836789131165},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.5431848764419556},{"id":"https://openalex.org/keywords/core","display_name":"Core (optical fiber)","score":0.5318676233291626},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.3324744403362274},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.3254064917564392},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.08163142204284668}],"concepts":[{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.655536949634552},{"id":"https://openalex.org/C3020431745","wikidata":"https://www.wikidata.org/wiki/Q25325220","display_name":"Many core","level":2,"score":0.6286253929138184},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6088836789131165},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.5431848764419556},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.5318676233291626},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.3324744403362274},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.3254064917564392},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.08163142204284668}],"mesh":[],"locations_count":2,"locations":[{"id":"mag:3101819589","is_oa":false,"landing_page_url":"https://drum.lib.umd.edu/handle/1903/26626","pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":null},{"id":"doi:10.13016/egom-sbxg","is_oa":true,"landing_page_url":"https://doi.org/10.13016/egom-sbxg","pdf_url":null,"source":{"id":"https://openalex.org/S4306402644","display_name":"Digital Repository at the University of Maryland (University of Maryland College Park)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I66946132","host_organization_name":"University of Maryland, College Park","host_organization_lineage":["https://openalex.org/I66946132"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"thesis"}],"best_oa_location":{"id":"doi:10.13016/egom-sbxg","is_oa":true,"landing_page_url":"https://doi.org/10.13016/egom-sbxg","pdf_url":null,"source":{"id":"https://openalex.org/S4306402644","display_name":"Digital Repository at the University of Maryland (University of Maryland College Park)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I66946132","host_organization_name":"University of Maryland, College Park","host_organization_lineage":["https://openalex.org/I66946132"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"thesis"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W50833228","https://openalex.org/W99581410","https://openalex.org/W2786055806","https://openalex.org/W145939741","https://openalex.org/W2789127250","https://openalex.org/W1554811168","https://openalex.org/W1572074260","https://openalex.org/W2469322671","https://openalex.org/W2157819149","https://openalex.org/W2035282552","https://openalex.org/W2255048617","https://openalex.org/W2281910244"],"abstract_inverted_index":{"This":[0,307],"dissertation":[1],"demonstrates":[2],"the":[3,16,30,54,59,76,148,152,166,249,268,282,311,316,366,378,422,493],"possibility":[4],"of":[5,12,45,62,68,91,109,117,150,155,173,190,214,237,254,272,284,315,323,368,372,377,381,396,427,440,497,504],"obtaining":[6],"strong":[7],"speedups":[8,67,90,162,236,496],"for":[9,134,198,209,241,245,424,436,495],"a":[10,63,81,124,144,174,180,191,217,285,292,299,320,326,404,414,425,444,502],"variety":[11,503],"parallel":[13,20,49,118,145,188,207],"applications":[14,369,459],"versus":[15,247],"best":[17,77],"serial":[18,47,78,171],"and":[19,48,51,212,220,234,243,348,391,420],"implementations":[21],"on":[22,72,163,179,232,281,310,467,473],"commodity":[23],"platforms.":[24],"These":[25],"results":[26,289,511],"were":[27],"obtained":[28],"using":[29,80],"PRAM-inspired":[31],"Explicit":[32],"Multi-Threading":[33],"(XMT)":[34],"many-core":[35,286,294],"computing":[36,302],"platform,":[37,319],"which":[38,324],"is":[39,325,453],"designed":[40],"to":[41,70,75,93,136,147,239,334,339,352,434,499],"efficiently":[42],"support":[43],"execution":[44],"both":[46],"code":[50,133],"switching":[52],"between":[53],"two.":[55],"Biconnectivity:":[56],"For":[57,97],"finding":[58],"biconnected":[60],"components":[61,154,176,193],"graph,":[64],"we":[65,100,128,229,266,357,364,412,479],"demonstrate":[66,101,421],"9x":[69],"33x":[71],"XMT":[73,103,164,233,317],"relative":[74],"algorithm":[79,177,194],"relatively":[82],"modest":[83],"silicon":[84,113,277],"budget.":[85],"Further":[86],"evidence":[87],"suggests":[88],"that":[89,102,270,291,331,371,483,509],"21x":[92],"48x":[94],"are":[95],"possible.":[96],"graph":[98],"connectivity,":[99],"outperforms":[104],"two":[105],"contemporary":[106],"NVIDIA":[107],"GPUs":[108,135],"similar":[110],"or":[111],"greater":[112],"area.":[114],"Prior":[115],"studies":[116],"biconnectivity":[119,132,138],"algorithms":[120,208],"achieved":[121],"at":[122],"most":[123,431,465],"4x":[125],"speedup,":[126],"but":[127],"could":[129,296],"not":[130],"find":[131],"compare":[137],"against":[139],"them.":[140],"Triconnectivity:":[141],"We":[142,159,203,491,507],"present":[143,204],"solution":[146],"problem":[149,389,457,462,505],"determining":[151],"triconnected":[153,175,192],"an":[156,264,418,438,454],"undirected":[157],"graph.":[158],"obtain":[160],"significant":[161],"over":[165,216,429],"only":[167],"published":[168,197],"optimal":[169],"(linear-time)":[170],"implementation":[172,189,253,439],"running":[178],"modern":[181],"CPU.":[182],"To":[183,224,401],"our":[184],"knowledge,":[185],"no":[186],"other":[187],"has":[195,471],"been":[196],"any":[199],"platform.":[200],"Burrows-Wheeler":[201,210,255],"compression:":[202],"novel":[205],"work-optimal":[206],"compression":[211],"decompression":[213],"strings":[215],"constant":[218],"alphabet":[219],"their":[221],"empirical":[222],"evaluation.":[223],"validate":[225],"these":[226,510],"theoretical":[227],"algorithms,":[228],"implement":[230],"them":[231],"show":[235,290,492],"up":[238,486,498],"25x":[240],"compression,":[242],"13x":[244],"decompression,":[246],"bzip2,":[248],"de":[250],"facto":[251],"standard":[252],"compression.":[256],"Fast":[257],"Fourier":[258],"transform":[259],"(FFT):":[260],"Using":[261],"FFT":[262],"as":[263],"example,":[265],"examine":[267],"impact":[269],"adoption":[271],"some":[273,341,384],"enabling":[274],"technologies,":[275],"including":[276,360],"photonics,":[278],"would":[279],"have":[280],"performance":[283],"architecture.":[287],"The":[288],"single-chip":[293],"processor":[295],"potentially":[297],"outperform":[298],"large":[300],"high-performance":[301],"cluster.":[303],"Boosted":[304],"decision":[305,442],"trees:":[306],"chapter":[308],"focuses":[309],"hybrid":[312,354,405],"memory":[313,336,346,355,406],"architecture":[314,347,407,419],"computer":[318,415],"key":[321],"part":[322],"flexible":[327],"all-to-all":[328],"interconnection":[329],"network":[330],"connects":[332],"processors":[333],"shared":[335],"modules.":[337],"First,":[338],"understand":[340],"recent":[342],"advances":[343],"in":[344,392,460],"GPU":[345,433],"how":[349,403],"they":[350],"relate":[351],"this":[353],"architecture,":[356],"use":[358],"microbenchmarks":[359],"list":[361],"ranking.":[362],"Then,":[363],"contrast":[365],"scalability":[367,379],"with":[370,416,458],"routines.":[373],"In":[374],"particular,":[375],"regardless":[376],"needs":[380],"full":[382],"applications,":[383,411],"routines":[385],"may":[386],"involve":[387],"smaller":[388,394],"sizes,":[390],"particular":[393],"levels":[395],"parallelism,":[397],"perhaps":[398],"even":[399],"serial.":[400],"see":[402],"can":[408,484],"benefit":[409],"such":[410,417],"simulate":[413],"potential":[423,494],"speedup":[426],"3.3X":[428],"NVIDIA's":[430],"powerful":[432],"date":[435],"XGBoost,":[437],"boosted":[441],"trees,":[443],"timely":[445],"machine":[446],"learning":[447],"approach.":[448],"Boolean":[449],"satisfiability":[450],"(SAT):":[451],"SAT":[452,469,489],"important":[455],"performance-hungry":[456],"many":[461],"domains.":[463],"However,":[464],"work":[466],"parallelizing":[468],"solvers":[470],"focused":[472],"coarse-grained,":[474],"mostly":[475],"embarrassing":[476],"parallelism.":[477],"Here,":[478],"study":[480],"fine-grained":[481],"parallelism":[482],"speed":[485],"existing":[487],"sequential":[488],"solvers.":[490],"382X":[500],"across":[501],"instances.":[506],"hope":[508],"will":[512],"stimulate":[513],"future":[514],"research.":[515]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
