{"id":"https://openalex.org/W4415090695","doi":"https://doi.org/10.1145/3748522.3779854","title":"ReCross: Efficient Embedding Reduction Scheme for In-Memory Computing using ReRAM-Based Crossbar","display_name":"ReCross: Efficient Embedding Reduction Scheme for In-Memory Computing using ReRAM-Based Crossbar","publication_year":2025,"publication_date":"2025-09-12","ids":{"openalex":"https://openalex.org/W4415090695","doi":"https://doi.org/10.1145/3748522.3779854"},"language":"en","primary_location":{"id":"doi:10.1145/3748522.3779854","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3748522.3779854","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 41st ACM/SIGAPP Symposium on Applied Computing","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2509.10627","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5090629044","display_name":"Yu\u2010Hong Lai","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Lai, Yu-Hong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104192300","display_name":"Chieh-Lin Tsai","orcid":"https://orcid.org/0009-0001-4820-2790"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tsai, Chieh-Lin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033796500","display_name":"Wen Sheng Lim","orcid":"https://orcid.org/0000-0002-2391-8127"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lim, Wen Sheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008331570","display_name":"Han-Wen Hu","orcid":"https://orcid.org/0000-0002-7985-9939"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Han-Wen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056407308","display_name":"Tei\u2010Wei Kuo","orcid":"https://orcid.org/0000-0003-1974-0394"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kuo, Tei-Wei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5073534245","display_name":"Yuan-Hao Chang","orcid":"https://orcid.org/0000-0002-1282-2111"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chang, Yuan-Hao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5090629044"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.24442123,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"333","last_page":"341"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9908999800682068,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/crossbar-switch","display_name":"Crossbar switch","score":0.8865000009536743},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.8291000127792358},{"id":"https://openalex.org/keywords/scheme","display_name":"Scheme (mathematics)","score":0.5884000062942505},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.5572999715805054},{"id":"https://openalex.org/keywords/resistive-random-access-memory","display_name":"Resistive random-access memory","score":0.5404999852180481},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.5260000228881836},{"id":"https://openalex.org/keywords/in-memory-processing","display_name":"In-Memory Processing","score":0.44699999690055847},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4221000075340271}],"concepts":[{"id":"https://openalex.org/C29984679","wikidata":"https://www.wikidata.org/wiki/Q1929149","display_name":"Crossbar switch","level":2,"score":0.8865000009536743},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.8291000127792358},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7785999774932861},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.5884000062942505},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.5572999715805054},{"id":"https://openalex.org/C182019814","wikidata":"https://www.wikidata.org/wiki/Q1143830","display_name":"Resistive random-access memory","level":3,"score":0.5404999852180481},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.5260000228881836},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5152999758720398},{"id":"https://openalex.org/C123593499","wikidata":"https://www.wikidata.org/wiki/Q6008583","display_name":"In-Memory Processing","level":5,"score":0.44699999690055847},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4221000075340271},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.3993000090122223},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3935000002384186},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.35089999437332153},{"id":"https://openalex.org/C188045654","wikidata":"https://www.wikidata.org/wiki/Q17148339","display_name":"Memory bandwidth","level":2,"score":0.3197999894618988},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3116999864578247},{"id":"https://openalex.org/C101722063","wikidata":"https://www.wikidata.org/wiki/Q218825","display_name":"Random access","level":2,"score":0.2957000136375427},{"id":"https://openalex.org/C6899612","wikidata":"https://www.wikidata.org/wiki/Q852911","display_name":"Resistive touchscreen","level":2,"score":0.295199990272522},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2863999903202057},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.27639999985694885},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.2721000015735626},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2718000113964081},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.26840001344680786},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.2651999890804291},{"id":"https://openalex.org/C2994168587","wikidata":"https://www.wikidata.org/wiki/Q5295","display_name":"Random access memory","level":2,"score":0.2644999921321869},{"id":"https://openalex.org/C2778820799","wikidata":"https://www.wikidata.org/wiki/Q3454688","display_name":"Cost reduction","level":2,"score":0.2612999975681305},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.25780001282691956},{"id":"https://openalex.org/C3826847","wikidata":"https://www.wikidata.org/wiki/Q188768","display_name":"FLOPS","level":2,"score":0.2549000084400177},{"id":"https://openalex.org/C194080101","wikidata":"https://www.wikidata.org/wiki/Q46306","display_name":"Access time","level":2,"score":0.2533000111579895},{"id":"https://openalex.org/C150072547","wikidata":"https://www.wikidata.org/wiki/Q212923","display_name":"Memristor","level":2,"score":0.25279998779296875}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3748522.3779854","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3748522.3779854","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 41st ACM/SIGAPP Symposium on Applied Computing","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2509.10627","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.10627","pdf_url":"https://arxiv.org/pdf/2509.10627","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2509.10627","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2509.10627","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2509.10627","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2509.10627","pdf_url":"https://arxiv.org/pdf/2509.10627","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Deep":[0],"learning-based":[1],"recommendation":[2],"models":[3,24],"(DLRMs)":[4],"are":[5],"widely":[6],"deployed":[7],"in":[8,22,101,155,162],"commercial":[9],"applications":[10],"to":[11,31,41,74,93,166],"enhance":[12,98],"user":[13],"experience.":[14],"However,":[15],"the":[16],"large":[17],"and":[18,36,45,59,78,97,110,117,127,158],"sparse":[19],"embedding":[20,64,103,107],"layers":[21],"these":[23],"impose":[25],"substantial":[26],"memory":[27,33,52],"bandwidth":[28],"bottlenecks":[29],"due":[30],"high":[32],"access":[34,38,51,108],"costs":[35],"irregular":[37],"patterns,":[39],"leading":[40],"increased":[42],"inference":[43],"time":[44,96,157],"energy":[46,99,144,163],"consumption.":[47],"While":[48],"resistive":[49],"random":[50],"(ReRAM)":[53],"based":[54],"crossbars":[55],"offer":[56],"a":[57,134,152,159],"fast":[58],"energy-efficient":[60],"solution":[61],"through":[62],"in-memory":[63,88,130],"reduction":[65,154],"operations,":[66],"naively":[67],"mapping":[68,118],"embeddings":[69,124],"onto":[70],"crossbar":[71,76,112],"arrays":[72],"leads":[73],"poor":[75],"utilization":[77],"thus":[79],"degrades":[80],"performance.":[81],"We":[82],"present":[83],"ReCross,":[84],"an":[85],"efficient":[86],"ReRAM-based":[87],"computing":[89],"(IMC)":[90],"scheme":[91],"designed":[92,136],"minimize":[94],"execution":[95,156],"efficiency":[100,164],"DLRM":[102],"reduction.":[104],"ReCross":[105,150],"co-optimizes":[106],"patterns":[109],"ReRAM":[111],"characteristics":[113],"by":[114],"intelligently":[115],"grouping":[116],"co-occurring":[119],"embeddings,":[120],"replicating":[121],"frequently":[122],"accessed":[123],"across":[125],"crossbars,":[126],"dynamically":[128],"selecting":[129],"processing":[131],"operations":[132],"using":[133],"newly":[135],"dynamic":[137],"switch":[138],"ADC":[139],"circuit":[140],"that":[141,149],"considers":[142],"runtime":[143],"trade-offs.":[145],"Experimental":[146],"results":[147],"demonstrate":[148],"achieves":[151],"3.97x":[153],"6.1x":[160],"improvement":[161],"compared":[165],"state-of-the-art":[167],"IMC":[168],"approaches.":[169]},"counts_by_year":[],"updated_date":"2026-06-10T14:10:52.464848","created_date":"2025-10-12T00:00:00"}
