{"id":"https://openalex.org/W7154513969","doi":"https://doi.org/10.48550/arxiv.2604.12278","title":"LightMat-HP: A Photonic-Electronic System for Accelerating General Matrix Multiplication With Configurable Precision","display_name":"LightMat-HP: A Photonic-Electronic System for Accelerating General Matrix Multiplication With Configurable Precision","publication_year":2026,"publication_date":"2026-04-14","ids":{"openalex":"https://openalex.org/W7154513969","doi":"https://doi.org/10.48550/arxiv.2604.12278"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.12278","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.12278","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.12278","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133721451","display_name":"Hailong Gong","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Gong, Hailong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133668270","display_name":"Haibo Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Haibo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039459434","display_name":"Amanda S. Barnard","orcid":"https://orcid.org/0000-0002-4784-2382"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Barnard, Amanda S.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133675061","display_name":"Mahbub Hassan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hassan, Mahbub","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133553581","display_name":"Matt Woolley","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Woolley, Matt","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5014716105","display_name":"Rajkumar Buyya","orcid":"https://orcid.org/0000-0001-9754-6496"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Buyya, Rajkumar","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5133721451"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12611","display_name":"Neural Networks and Reservoir Computing","score":0.9200999736785889,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12611","display_name":"Neural Networks and Reservoir Computing","score":0.9200999736785889,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10299","display_name":"Photonic and Optical Devices","score":0.04170000180602074,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10232","display_name":"Optical Network Technologies","score":0.007799999788403511,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/photonics","display_name":"Photonics","score":0.717199981212616},{"id":"https://openalex.org/keywords/matrix-multiplication","display_name":"Matrix multiplication","score":0.6952999830245972},{"id":"https://openalex.org/keywords/multiplication","display_name":"Multiplication (music)","score":0.6532999873161316},{"id":"https://openalex.org/keywords/dataflow","display_name":"Dataflow","score":0.5073999762535095},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.46790000796318054},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.43939998745918274},{"id":"https://openalex.org/keywords/optical-computing","display_name":"Optical computing","score":0.41290000081062317},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.3628999888896942}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7196000218391418},{"id":"https://openalex.org/C20788544","wikidata":"https://www.wikidata.org/wiki/Q467054","display_name":"Photonics","level":2,"score":0.717199981212616},{"id":"https://openalex.org/C17349429","wikidata":"https://www.wikidata.org/wiki/Q1049914","display_name":"Matrix multiplication","level":3,"score":0.6952999830245972},{"id":"https://openalex.org/C2780595030","wikidata":"https://www.wikidata.org/wiki/Q3860309","display_name":"Multiplication (music)","level":2,"score":0.6532999873161316},{"id":"https://openalex.org/C96324660","wikidata":"https://www.wikidata.org/wiki/Q205446","display_name":"Dataflow","level":2,"score":0.5073999762535095},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.46790000796318054},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.43939998745918274},{"id":"https://openalex.org/C148204187","wikidata":"https://www.wikidata.org/wiki/Q176541","display_name":"Optical computing","level":2,"score":0.41290000081062317},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.3628999888896942},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.3513999879360199},{"id":"https://openalex.org/C104267543","wikidata":"https://www.wikidata.org/wiki/Q208163","display_name":"Signal processing","level":3,"score":0.33959999680519104},{"id":"https://openalex.org/C84462506","wikidata":"https://www.wikidata.org/wiki/Q173142","display_name":"Digital signal processing","level":2,"score":0.3264000117778778},{"id":"https://openalex.org/C24326235","wikidata":"https://www.wikidata.org/wiki/Q126095","display_name":"Electronic engineering","level":1,"score":0.32280001044273376},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.3125},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.3050000071525574},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.30480000376701355},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.3034999966621399},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.29170000553131104},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.2863999903202057},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.2858999967575073},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.2653999924659729},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.2540000081062317}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.12278","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.12278","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.12278","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.12278","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy","score":0.903911292552948}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Matrix":[0],"multiplication":[1,91,124,135,149],"is":[2,20,151],"a":[3,32,79,121,165,185],"fundamental":[4],"kernel":[5],"in":[6,69,136],"large-scale":[7,174],"artificial":[8],"intelligence":[9],"and":[10,26,42,62,169,184,192,198,212],"scientific":[11],"computing,":[12],"but":[13],"its":[14,37,171,204],"performance":[15,172],"on":[16,164],"conventional":[17],"electronic":[18],"accelerators":[19],"increasingly":[21],"constrained":[22],"by":[23],"memory":[24],"bandwidth":[25],"energy":[27,193],"efficiency.":[28],"Photonic":[29],"computing":[30,82,167],"offers":[31],"promising":[33],"alternative":[34],"due":[35],"to":[36,53,102,141,154,203],"ultra-high":[38],"bandwidth,":[39],"massive":[40],"parallelism,":[41],"low":[43,132],"power":[44],"dissipation.":[45],"However,":[46],"most":[47],"existing":[48],"photonic":[49,117,123,134,166,187,207],"systems":[50],"are":[51],"limited":[52],"low-precision":[54],"computation":[55],"because":[56],"of":[57,88,116,131,157],"analog":[58],"optical":[59],"modulation":[60],"constraints":[61],"noise":[63],"accumulation,":[64],"which":[65],"restricts":[66],"their":[67],"applicability":[68],"precision-critical":[70],"workloads.":[71],"To":[72,111],"address":[73],"this":[74],"limitation,":[75],"we":[76,119],"propose":[77,120],"LightMat-HP,":[78],"hybrid":[80],"photonic-electronic":[81],"system":[83],"that":[84,126,179],"enables":[85],"end-to-end":[86],"acceleration":[87],"general":[89],"matrix":[90,148,200],"with":[92,138],"configurable":[93],"computational":[94,104],"precision.":[95],"LightMat-HP":[96,163,180],"adopts":[97],"block":[98],"floating-point":[99],"(BFP)":[100],"arithmetic":[101],"reduce":[103],"complexity":[105],"while":[106],"enabling":[107],"flexible":[108],"precision-performance":[109],"tradeoffs.":[110],"overcome":[112],"the":[113,128],"precision":[114],"limitations":[115],"devices,":[118],"slicing-based":[122],"scheme":[125],"exploits":[127],"high":[129],"accuracy":[130],"bit-width":[133],"combination":[137],"digital":[139],"accumulation":[140],"achieve":[142],"high-precision":[143],"mantissa":[144],"multiplication.":[145],"A":[146],"tile-based":[147],"dataflow":[150],"further":[152],"designed":[153],"support":[155],"matrices":[156],"arbitrary":[158],"sizes.":[159],"We":[160],"experimentally":[161],"validate":[162],"prototype":[168],"evaluate":[170],"through":[173],"simulations.":[175],"The":[176],"results":[177],"demonstrate":[178],"outperforms":[181],"FPGA,":[182],"GPU,":[183],"state-of-the-art":[186],"accelerator":[188],"across":[189],"throughput,":[190],"latency,":[191],"efficiency,":[194],"particularly":[195],"for":[196],"small-":[197],"medium-sized":[199],"multiplications,":[201],"owing":[202],"highly":[205],"parallel":[206],"architecture,":[208],"efficient":[209],"data":[210],"movement,":[211],"slice-based":[213],"BFP":[214],"arithmetic.":[215]},"counts_by_year":[],"updated_date":"2026-04-16T06:09:31.884825","created_date":"2026-04-16T00:00:00"}
