{"id":"https://openalex.org/W7128819700","doi":"https://doi.org/10.48550/arxiv.2602.11562","title":"LASER: An Efficient Target-Aware Segmented Attention Framework for End-to-End Long Sequence Modeling","display_name":"LASER: An Efficient Target-Aware Segmented Attention Framework for End-to-End Long Sequence Modeling","publication_year":2026,"publication_date":"2026-02-12","ids":{"openalex":"https://openalex.org/W7128819700","doi":"https://doi.org/10.48550/arxiv.2602.11562"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2602.11562","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.11562","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2602.11562","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125912845","display_name":"Tianhe Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Lin, Tianhe","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106364476","display_name":"Ziwei Xiong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiong, Ziwei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125931694","display_name":"Baoyuan Ou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ou, Baoyuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125891420","display_name":"Yingjie Qin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qin, Yingjie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125965510","display_name":"Lai Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Lai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125904076","display_name":"Xiaocheng Zhong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhong, Xiaocheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125964700","display_name":"Yao Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Yao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125975690","display_name":"Zhiyong Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zhiyong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125943149","display_name":"Tao Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Tao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125980895","display_name":"Yubin Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Yubin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5125996731","display_name":"Di Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Di","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5125912845"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.33469998836517334,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.33469998836517334,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.1606999933719635,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.05719999969005585,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.666100025177002},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.49540001153945923},{"id":"https://openalex.org/keywords/lift","display_name":"Lift (data mining)","score":0.47040000557899475},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.46959999203681946},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.4124000072479248},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.3822000026702881},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.3675000071525574},{"id":"https://openalex.org/keywords/online-model","display_name":"Online model","score":0.3564999997615814}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8263999819755554},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.666100025177002},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.49540001153945923},{"id":"https://openalex.org/C139002025","wikidata":"https://www.wikidata.org/wiki/Q3001212","display_name":"Lift (data mining)","level":2,"score":0.47040000557899475},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.46959999203681946},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.4124000072479248},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.39969998598098755},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.3822000026702881},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.3675000071525574},{"id":"https://openalex.org/C2777851325","wikidata":"https://www.wikidata.org/wiki/Q7094102","display_name":"Online model","level":2,"score":0.3564999997615814},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3544999957084656},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.35190001130104065},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3492000102996826},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.321399986743927},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.3190000057220459},{"id":"https://openalex.org/C46637626","wikidata":"https://www.wikidata.org/wiki/Q6693015","display_name":"Low latency (capital markets)","level":2,"score":0.3041999936103821},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.30070000886917114},{"id":"https://openalex.org/C129844170","wikidata":"https://www.wikidata.org/wiki/Q41299","display_name":"Quadratic equation","level":2,"score":0.2904999852180481},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.2833000123500824},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.27309998869895935},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.2619999945163727},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2603999972343445},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.2578999996185303}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2602.11562","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.11562","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2602.11562","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.11562","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.5969695448875427}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Modeling":[0],"ultra-long":[1],"user":[2,42,92,120,144],"behavior":[3],"sequences":[4],"is":[5],"pivotal":[6],"for":[7,90],"capturing":[8],"evolving":[9],"and":[10,44,65,107,118,230,239],"lifelong":[11],"interests":[12],"in":[13,21,228,234],"modern":[14],"recommendation":[15],"systems.":[16],"However,":[17],"deploying":[18],"such":[19],"models":[20],"real-time":[22,117],"industrial":[23],"environments":[24],"faces":[25],"a":[26,60,85,96,127,148,155,164,225,231],"strict":[27],"\"Latency":[28],"Wall\",":[29],"constrained":[30],"by":[31,105,110,139],"two":[32,76],"distinct":[33],"bottlenecks:":[34],"the":[35,45,73,135,140,192],"high":[36,182],"I/O":[37],"latency":[38,104],"of":[39,49,143,194],"retrieving":[40],"massive":[41],"histories":[43],"quadratic":[46],"computational":[47,136,183],"complexity":[48,193],"standard":[50],"attention":[51],"mechanisms.":[52],"To":[53],"break":[54],"these":[55,173],"bottlenecks,":[56],"we":[57],"present":[58],"LASER,":[59],"full-stack":[61],"optimization":[62],"framework":[63],"developed":[64],"deployed":[66],"at":[67],"Xiaohongshu":[68],"(RedNote).":[69],"Our":[70],"approach":[71],"tackles":[72],"challenges":[74],"through":[75],"complementary":[77],"innovations:":[78],"(1)":[79],"System":[80],"efficiency:":[81,124],"We":[82,125],"introduce":[83],"SeqVault,":[84],"unified":[86],"schema-aware":[87],"serving":[88,216],"infrastructure":[89],"long":[91],"histories.":[93,121],"By":[94],"implementing":[95],"hybrid":[97],"DRAM-SSD":[98],"indexing":[99],"strategy,":[100],"SeqVault":[101],"reduces":[102],"retrieval":[103],"50%":[106],"CPU":[108],"usage":[109],"75%,":[111],"ensuring":[112],"millisecond-level":[113],"access":[114],"to":[115,133,158,176],"full":[116],"life-cycle":[119],"(2)":[122],"Algorithmic":[123],"propose":[126],"Segmented":[128],"Target":[129,168],"Attention":[130,169],"(STA)":[131],"mechanism":[132,157],"address":[134],"overhead.":[137],"Motivated":[138],"inherent":[141],"sparsity":[142],"interests,":[145],"STA":[146],"employs":[147],"sigmoid-based":[149],"gating":[150],"strategy":[151],"that":[152,205],"acts":[153],"as":[154],"silence":[156],"filter":[159],"out":[160],"noisy":[161],"items.":[162],"Subsequently,":[163],"lightweight":[165],"Global":[166],"Stacked":[167],"(GSTA)":[170],"module":[171],"refines":[172],"compressed":[174],"segments":[175],"capture":[177],"cross-segment":[178],"dependencies":[179],"without":[180],"incurring":[181],"costs.":[184],"This":[185],"design":[186],"performs":[187],"effective":[188],"sequence":[189],"compression,":[190],"reducing":[191],"long-sequence":[195],"modeling":[196],"while":[197],"preserving":[198],"critical":[199],"signals.":[200],"Extensive":[201],"offline":[202],"evaluations":[203],"demonstrate":[204],"LASER":[206,223],"consistently":[207],"outperforms":[208],"state-of-the-art":[209],"baselines.":[210],"In":[211],"large-scale":[212],"online":[213],"A/B":[214],"testing":[215],"over":[217],"100":[218],"million":[219],"daily":[220],"active":[221],"users,":[222],"achieved":[224],"2.36%":[226],"lift":[227,233],"ADVV":[229],"2.08%":[232],"revenue,":[235],"demonstrating":[236],"its":[237],"scalability":[238],"significant":[240],"commercial":[241],"impact.":[242]},"counts_by_year":[],"updated_date":"2026-02-14T06:27:19.455381","created_date":"2026-02-14T00:00:00"}
