{"id":"https://openalex.org/W4379115905","doi":"https://doi.org/10.23919/date56975.2023.10136962","title":"M5: Multi-modal Multi-task Model Mapping on Multi-FPGA with Accelerator Configuration Search","display_name":"M5: Multi-modal Multi-task Model Mapping on Multi-FPGA with Accelerator Configuration Search","publication_year":2023,"publication_date":"2023-04-01","ids":{"openalex":"https://openalex.org/W4379115905","doi":"https://doi.org/10.23919/date56975.2023.10136962"},"language":"en","primary_location":{"id":"doi:10.23919/date56975.2023.10136962","is_oa":false,"landing_page_url":"https://doi.org/10.23919/date56975.2023.10136962","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 Design, Automation &amp; Test in Europe Conference &amp; Exhibition (DATE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5047594193","display_name":"Akshay Karkal Kamath","orcid":null},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Akshay Karkal Kamath","raw_affiliation_strings":["School of Electrical and Computer Engineering, Georgia Institute of Technology,Atlanta,GA,USA","School of Electrical and Computer Engineering, Georgia Institute of Technology, Atlanta, GA, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Georgia Institute of Technology,Atlanta,GA,USA","institution_ids":["https://openalex.org/I130701444"]},{"raw_affiliation_string":"School of Electrical and Computer Engineering, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076244218","display_name":"Stefan Abi-Karam","orcid":"https://orcid.org/0000-0002-6697-8517"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Stefan Abi-Karam","raw_affiliation_strings":["School of Electrical and Computer Engineering, Georgia Institute of Technology,Atlanta,GA,USA","Georgia Tech Research Institlute, Atlanta, GA, USA","School of Electrical and Computer Engineering, Georgia Institute of Technology, Atlanta, GA, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Georgia Institute of Technology,Atlanta,GA,USA","institution_ids":["https://openalex.org/I130701444"]},{"raw_affiliation_string":"Georgia Tech Research Institlute, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]},{"raw_affiliation_string":"School of Electrical and Computer Engineering, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039742451","display_name":"Ashwin Bhat","orcid":"https://orcid.org/0000-0002-6395-9345"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ashwin Bhat","raw_affiliation_strings":["School of Electrical and Computer Engineering, Georgia Institute of Technology,Atlanta,GA,USA","School of Electrical and Computer Engineering, Georgia Institute of Technology, Atlanta, GA, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Georgia Institute of Technology,Atlanta,GA,USA","institution_ids":["https://openalex.org/I130701444"]},{"raw_affiliation_string":"School of Electrical and Computer Engineering, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053022655","display_name":"Cong Hao","orcid":"https://orcid.org/0000-0002-2541-8767"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Cong Hao","raw_affiliation_strings":["School of Electrical and Computer Engineering, Georgia Institute of Technology,Atlanta,GA,USA","School of Electrical and Computer Engineering, Georgia Institute of Technology, Atlanta, GA, USA"],"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, Georgia Institute of Technology,Atlanta,GA,USA","institution_ids":["https://openalex.org/I130701444"]},{"raw_affiliation_string":"School of Electrical and Computer Engineering, Georgia Institute of Technology, Atlanta, GA, USA","institution_ids":["https://openalex.org/I130701444"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5047594193"],"corresponding_institution_ids":["https://openalex.org/I130701444"],"apc_list":null,"apc_paid":null,"fwci":0.614,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.68703587,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7857933044433594},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.7165067195892334},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6490839719772339},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5843969583511353},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5512321591377258},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.5226231217384338},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.5124845504760742},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.44870203733444214},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.43460798263549805},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.42426592111587524},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.42319634556770325},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.38992148637771606},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.3817087411880493},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.29804885387420654},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.09981149435043335}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7857933044433594},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.7165067195892334},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6490839719772339},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5843969583511353},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5512321591377258},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.5226231217384338},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.5124845504760742},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.44870203733444214},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.43460798263549805},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42426592111587524},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.42319634556770325},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.38992148637771606},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.3817087411880493},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.29804885387420654},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.09981149435043335},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.23919/date56975.2023.10136962","is_oa":false,"landing_page_url":"https://doi.org/10.23919/date56975.2023.10136962","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 Design, Automation &amp; Test in Europe Conference &amp; Exhibition (DATE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W2063123613","https://openalex.org/W2075164088","https://openalex.org/W2104680817","https://openalex.org/W2115826669","https://openalex.org/W2194775991","https://openalex.org/W2624871570","https://openalex.org/W2810551871","https://openalex.org/W2835955725","https://openalex.org/W2945306514","https://openalex.org/W2962799344","https://openalex.org/W2962953210","https://openalex.org/W2964245886","https://openalex.org/W2969289739","https://openalex.org/W3018693022","https://openalex.org/W3025152414","https://openalex.org/W3109100377","https://openalex.org/W3121413886","https://openalex.org/W3131073178","https://openalex.org/W3143320354","https://openalex.org/W3159273459","https://openalex.org/W3165926952","https://openalex.org/W3168704267","https://openalex.org/W3174183088","https://openalex.org/W3176063860","https://openalex.org/W4293025058","https://openalex.org/W6687483927","https://openalex.org/W6762306914","https://openalex.org/W6777407758","https://openalex.org/W6795879938"],"related_works":["https://openalex.org/W2111241003","https://openalex.org/W2355315220","https://openalex.org/W4200391368","https://openalex.org/W2210979487","https://openalex.org/W2074043759","https://openalex.org/W2316202402","https://openalex.org/W2389214306","https://openalex.org/W1967938402","https://openalex.org/W2386041993","https://openalex.org/W1608572506"],"abstract_inverted_index":{"Recent":[0],"machine":[1],"learning":[2],"(ML)":[3],"models":[4,15,55,89],"have":[5,17],"advanced":[6],"from":[7],"single-modality":[8],"single-task":[9],"to":[10,91,112,131,155,174],"multi-modality":[11],"multi-task":[12],"(MMMT).":[13],"MMMT":[14,54,88,103,140],"typically":[16],"multiple":[18,57,114],"backbones":[19],"of":[20,78,84,159,167],"different":[21],"sizes":[22],"along":[23],"with":[24],"complicated":[25],"connections,":[26],"exposing":[27],"great":[28],"challenges":[29],"for":[30,52,87,107],"hardware":[31],"deployment.":[32],"For":[33,137],"scalable":[34],"and":[35,126,153,162,170],"energy-efficient":[36],"implementations,":[37],"multi-FPGA":[38],"systems":[39],"are":[40],"emerging":[41],"as":[42],"the":[43,49,75,118,134,165,176],"ideal":[44],"design":[45],"choices.":[46],"However,":[47],"finding":[48],"optimal":[50],"solutions":[51],"mapping":[53,62,151],"onto":[56],"FPGAs":[58,172],"is":[59,181],"non-trivial.":[60],"Existing":[61],"algorithms":[63,86],"focus":[64],"on":[65],"either":[66],"streamlined":[67],"linear":[68],"deep":[69],"neural":[70],"network":[71],"architectures":[72],"or":[73],"only":[74],"critical":[76],"path":[77],"simple":[79],"heterogeneous":[80],"models.":[81],"Direct":[82],"extensions":[83],"these":[85,96],"lead":[90,154],"sub-optimal":[92],"solutions.":[93],"To":[94],"address":[95],"shortcomings,":[97],"we":[98],"propose":[99],"M5,":[100],"a":[101],"novel":[102],"Model":[104],"Mapping":[105],"framework":[106],"Multi-FPGA":[108],"platforms.":[109],"In":[110],"addition":[111],"handling":[113],"modalities":[115],"present":[116],"in":[117,164],"models,":[119,141],"M5":[120,146],"can":[121,147],"flexibly":[122],"explore":[123],"accelerator":[124],"configurations":[125],"possible":[127],"resource":[128],"sharing":[129],"opportunities":[130],"significantly":[132],"improve":[133],"system":[135],"performance.":[136],"various":[138],"computation-heavy":[139],"experiment":[142],"results":[143],"demonstrate":[144],"that":[145],"remarkably":[148],"outperform":[149],"existing":[150],"methods":[152],"an":[156],"average":[157],"reduction":[158],"35%,":[160],"62%,":[161],"70%":[163],"number":[166],"low-end,":[168],"mid-end,":[169],"high-end":[171],"required":[173],"achieve":[175],"same":[177],"throughput,":[178],"respectively.":[179],"Code":[180],"publicly":[182],"available":[183],"<sup":[184],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[185],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">1</sup>":[186],",":[187]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-09T08:58:05.943551","created_date":"2025-10-10T00:00:00"}
