{"id":"https://openalex.org/W7118962775","doi":"https://doi.org/10.48550/arxiv.2601.00397","title":"Revati: Transparent GPU-Free Time-Warp Emulation for LLM Serving","display_name":"Revati: Transparent GPU-Free Time-Warp Emulation for LLM Serving","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7118962775","doi":"https://doi.org/10.48550/arxiv.2601.00397"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.00397","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.00397","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.00397","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5122218941","display_name":"Amey Agrawal","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Agrawal, Amey","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103158453","display_name":"Mayank Yadav","orcid":"https://orcid.org/0000-0003-0302-8108"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yadav, Mayank","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017948355","display_name":"Sukrit Kumar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kumar, Sukrit","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103533240","display_name":"Anirudha Agrawal","orcid":"https://orcid.org/0009-0009-6949-8859"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Agrawal, Anirudha","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122052928","display_name":"Garv Ghai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ghai, Garv","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122082382","display_name":"Souradeep Bera","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bera, Souradeep","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043541606","display_name":"Elton M\u00e1rtires Pinto","orcid":"https://orcid.org/0000-0002-1348-4185"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pinto, Elton","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092142175","display_name":"Sirish Gambhira","orcid":"https://orcid.org/0009-0009-3311-8308"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gambhira, Sirish","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122300372","display_name":"Mohammad Adain","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Adain, Mohammad","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122043384","display_name":"Kasra Sohrab","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sohrab, Kasra","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122092624","display_name":"Chus Antonanzas","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Antonanzas, Chus","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5048451114","display_name":"Alexey Tumanov","orcid":"https://orcid.org/0009-0005-7862-1477"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tumanov, Alexey","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":12,"corresponding_author_ids":["https://openalex.org/A5122218941"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.5547000169754028,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.5547000169754028,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.15289999544620514,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.08529999852180481,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/emulation","display_name":"Emulation","score":0.7289000153541565},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.5144000053405762},{"id":"https://openalex.org/keywords/protocol","display_name":"Protocol (science)","score":0.48159998655319214},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.4641000032424927},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.43560001254081726},{"id":"https://openalex.org/keywords/virtual-machine","display_name":"Virtual machine","score":0.3878999948501587},{"id":"https://openalex.org/keywords/synchronization","display_name":"Synchronization (alternating current)","score":0.3260999917984009},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.3188000023365021},{"id":"https://openalex.org/keywords/network-packet","display_name":"Network packet","score":0.3068000078201294}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8464000225067139},{"id":"https://openalex.org/C149810388","wikidata":"https://www.wikidata.org/wiki/Q5374873","display_name":"Emulation","level":2,"score":0.7289000153541565},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.5144000053405762},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.4896000027656555},{"id":"https://openalex.org/C2780385302","wikidata":"https://www.wikidata.org/wiki/Q367158","display_name":"Protocol (science)","level":3,"score":0.48159998655319214},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.4641000032424927},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.46059998869895935},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4480000138282776},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.43560001254081726},{"id":"https://openalex.org/C25344961","wikidata":"https://www.wikidata.org/wiki/Q192726","display_name":"Virtual machine","level":2,"score":0.3878999948501587},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3702000081539154},{"id":"https://openalex.org/C2778562939","wikidata":"https://www.wikidata.org/wiki/Q1298791","display_name":"Synchronization (alternating current)","level":3,"score":0.3260999917984009},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.3188000023365021},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.31130000948905945},{"id":"https://openalex.org/C158379750","wikidata":"https://www.wikidata.org/wiki/Q214111","display_name":"Network packet","level":2,"score":0.3068000078201294},{"id":"https://openalex.org/C120524526","wikidata":"https://www.wikidata.org/wiki/Q1709148","display_name":"Reboot","level":2,"score":0.29030001163482666},{"id":"https://openalex.org/C71559656","wikidata":"https://www.wikidata.org/wiki/Q671298","display_name":"Divide and conquer algorithms","level":2,"score":0.2896000146865845},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.28949999809265137},{"id":"https://openalex.org/C50630238","wikidata":"https://www.wikidata.org/wiki/Q971505","display_name":"General-purpose computing on graphics processing units","level":3,"score":0.27709999680519104},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.2766000032424927},{"id":"https://openalex.org/C513985346","wikidata":"https://www.wikidata.org/wiki/Q270471","display_name":"Virtualization","level":3,"score":0.27300000190734863},{"id":"https://openalex.org/C133162039","wikidata":"https://www.wikidata.org/wiki/Q1061077","display_name":"Code generation","level":3,"score":0.271699994802475},{"id":"https://openalex.org/C164866538","wikidata":"https://www.wikidata.org/wiki/Q367351","display_name":"Cluster (spacecraft)","level":2,"score":0.27129998803138733},{"id":"https://openalex.org/C553261973","wikidata":"https://www.wikidata.org/wiki/Q14579","display_name":"Linux kernel","level":2,"score":0.26739999651908875},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.2574000060558319},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.2524000108242035},{"id":"https://openalex.org/C29140674","wikidata":"https://www.wikidata.org/wiki/Q206637","display_name":"Computer cluster","level":2,"score":0.2515999972820282}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.00397","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.00397","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.00397","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.00397","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Deploying":[0],"LLMs":[1],"efficiently":[2],"requires":[3],"testing":[4],"hundreds":[5],"of":[6,22,86],"serving":[7,35,61,78],"configurations,":[8,133],"but":[9,30],"evaluating":[10],"each":[11],"one":[12],"on":[13],"a":[14,40,50,104],"GPU":[15,88,140],"cluster":[16],"takes":[17],"hours":[18],"and":[19,28,119,131],"costs":[20],"thousands":[21],"dollars.":[23],"Discrete-event":[24],"simulators":[25],"are":[26],"faster":[27,137],"cheaper,":[29],"they":[31],"require":[32],"re-implementing":[33],"the":[34],"system's":[36],"control":[37],"logic":[38],"--":[39,94],"burden":[41],"that":[42,53,107],"compounds":[43],"as":[44],"frameworks":[45,79],"evolve.":[46],"We":[47,102],"present":[48],"Revati,":[49],"time-warp":[51],"emulator":[52],"enables":[54],"performance":[55],"modeling":[56],"by":[57,98],"directly":[58],"executing":[59,87],"real":[60,139],"system":[62,68],"code":[63],"at":[64],"simulation-like":[65],"speed.":[66],"The":[67],"intercepts":[69],"CUDA":[70],"API":[71],"calls":[72],"to":[73,80],"virtualize":[74],"device":[75],"management,":[76],"allowing":[77],"run":[81],"without":[82],"physical":[83],"GPUs.":[84],"Instead":[85],"kernels,":[89],"it":[90],"performs":[91],"time":[92,97],"jumps":[93,110],"fast-forwarding":[95],"virtual":[96],"predicted":[99],"kernel":[100],"durations.":[101],"propose":[103],"coordination":[105],"protocol":[106],"synchronizes":[108],"these":[109],"across":[111,128],"distributed":[112],"processes":[113],"while":[114,134],"preserving":[115],"causality.":[116],"On":[117],"vLLM":[118],"SGLang,":[120],"Revati":[121],"achieves":[122],"less":[123],"than":[124,138],"5%":[125],"prediction":[126],"error":[127],"multiple":[129],"models":[130],"parallelism":[132],"running":[135],"5-17x":[136],"execution.":[141]},"counts_by_year":[],"updated_date":"2026-01-08T20:10:11.968330","created_date":"2026-01-08T00:00:00"}
