{"id":"https://openalex.org/W7124159067","doi":"https://doi.org/10.1109/ton.2025.3649068","title":"Cached Model-as-a-Resource: Provisioning Large Language Model Agents for Edge Intelligence in Space\u2013Air\u2013Ground Integrated Networks","display_name":"Cached Model-as-a-Resource: Provisioning Large Language Model Agents for Edge Intelligence in Space\u2013Air\u2013Ground Integrated Networks","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7124159067","doi":"https://doi.org/10.1109/ton.2025.3649068"},"language":"en","primary_location":{"id":"doi:10.1109/ton.2025.3649068","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ton.2025.3649068","pdf_url":null,"source":{"id":"https://openalex.org/S5407042750","display_name":"IEEE Transactions on Networking","issn_l":"2998-4157","issn":["2998-4157"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Networking","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5123045587","display_name":"Minrui Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Minrui Xu","raw_affiliation_strings":["College of Computing and Data Science, Nanyang Technological University, Jurong West, Singapore"],"affiliations":[{"raw_affiliation_string":"College of Computing and Data Science, Nanyang Technological University, Jurong West, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123017365","display_name":"Dusit Niyato","orcid":null},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Dusit Niyato","raw_affiliation_strings":["College of Computing and Data Science, Nanyang Technological University, Jurong West, Singapore"],"affiliations":[{"raw_affiliation_string":"College of Computing and Data Science, Nanyang Technological University, Jurong West, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123047267","display_name":"Hongliang Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongliang Zhang","raw_affiliation_strings":["School of Electronics, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Electronics, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106275656","display_name":"Jiawen Kang","orcid":null},"institutions":[{"id":"https://openalex.org/I139024713","display_name":"Guangdong University of Technology","ror":"https://ror.org/04azbjn80","country_code":"CN","type":"education","lineage":["https://openalex.org/I139024713"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiawen Kang","raw_affiliation_strings":["School of Automation, Guangdong University of Technology, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Automation, Guangdong University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I139024713"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005327587","display_name":"Zehui Xiong","orcid":"https://orcid.org/0000-0002-4440-941X"},"institutions":[{"id":"https://openalex.org/I126231945","display_name":"Queen's University Belfast","ror":"https://ror.org/00hswnk62","country_code":"GB","type":"education","lineage":["https://openalex.org/I126231945"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Zehui Xiong","raw_affiliation_strings":["Electrical Engineering and Computer Science (EEECS), School of Electronics, Queen&#x2019;s University Belfast, Belfast, U.K"],"affiliations":[{"raw_affiliation_string":"Electrical Engineering and Computer Science (EEECS), School of Electronics, Queen&#x2019;s University Belfast, Belfast, U.K","institution_ids":["https://openalex.org/I126231945"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123054004","display_name":"Shiwen Mao","orcid":null},"institutions":[{"id":"https://openalex.org/I82497590","display_name":"Auburn University","ror":"https://ror.org/02v80fc35","country_code":"US","type":"education","lineage":["https://openalex.org/I82497590"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shiwen Mao","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Auburn University, Auburn, AL, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Auburn University, Auburn, AL, USA","institution_ids":["https://openalex.org/I82497590"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5123036543","display_name":"Zhu Han","orcid":null},"institutions":[{"id":"https://openalex.org/I44461941","display_name":"University of Houston","ror":"https://ror.org/048sx0r50","country_code":"US","type":"education","lineage":["https://openalex.org/I44461941"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhu Han","raw_affiliation_strings":["Department of Electrical and Computer Engineering, University of Houston, Houston, TX, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Houston, Houston, TX, USA","institution_ids":["https://openalex.org/I44461941"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5123045587"],"corresponding_institution_ids":["https://openalex.org/I172675005"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.09393813,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":"34","issue":null,"first_page":"2850","last_page":"2864"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.25769999623298645,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.25769999623298645,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13553","display_name":"Age of Information Optimization","score":0.17990000545978546,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11133","display_name":"UAV Applications and Optimization","score":0.13449999690055847,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/provisioning","display_name":"Provisioning","score":0.802299976348877},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.6700000166893005},{"id":"https://openalex.org/keywords/edge-device","display_name":"Edge device","score":0.5856000185012817},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.5852000117301941},{"id":"https://openalex.org/keywords/server","display_name":"Server","score":0.4896000027656555},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.48910000920295715},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4666000008583069},{"id":"https://openalex.org/keywords/edge-computing","display_name":"Edge computing","score":0.4546000063419342}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8144999742507935},{"id":"https://openalex.org/C172191483","wikidata":"https://www.wikidata.org/wiki/Q1071806","display_name":"Provisioning","level":2,"score":0.802299976348877},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.6700000166893005},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.5856000185012817},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.5852000117301941},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.4896000027656555},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.48910000920295715},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4666000008583069},{"id":"https://openalex.org/C2778456923","wikidata":"https://www.wikidata.org/wiki/Q5337692","display_name":"Edge computing","level":3,"score":0.4546000063419342},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.44369998574256897},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.38029998540878296},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3621000051498413},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.36160001158714294},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.3386000096797943},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.32850000262260437},{"id":"https://openalex.org/C68649174","wikidata":"https://www.wikidata.org/wiki/Q1379116","display_name":"Base station","level":2,"score":0.314300000667572},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2913999855518341},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.2831000089645386},{"id":"https://openalex.org/C5038329","wikidata":"https://www.wikidata.org/wiki/Q1142907","display_name":"Core network","level":2,"score":0.2653000056743622},{"id":"https://openalex.org/C72108876","wikidata":"https://www.wikidata.org/wiki/Q844565","display_name":"Transaction processing","level":3,"score":0.26269999146461487},{"id":"https://openalex.org/C148730421","wikidata":"https://www.wikidata.org/wiki/Q141090","display_name":"Encryption","level":2,"score":0.2615000009536743},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.26080000400543213},{"id":"https://openalex.org/C2780609101","wikidata":"https://www.wikidata.org/wiki/Q17156588","display_name":"Resource management (computing)","level":2,"score":0.25540000200271606},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.2540999948978424}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/ton.2025.3649068","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ton.2025.3649068","pdf_url":null,"source":{"id":"https://openalex.org/S5407042750","display_name":"IEEE Transactions on Networking","issn_l":"2998-4157","issn":["2998-4157"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Networking","raw_type":"journal-article"},{"id":"pmh:oai:dr.ntu.edu.sg:10356/212380","is_oa":false,"landing_page_url":"https://hdl.handle.net/10356/212380","pdf_url":null,"source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W2571380762","https://openalex.org/W2805161269","https://openalex.org/W2889722097","https://openalex.org/W2924948991","https://openalex.org/W3036634962","https://openalex.org/W3083761276","https://openalex.org/W3127207655","https://openalex.org/W3128254715","https://openalex.org/W3129515304","https://openalex.org/W3137905079","https://openalex.org/W4226133071","https://openalex.org/W4285197124","https://openalex.org/W4294068647","https://openalex.org/W4320015749","https://openalex.org/W4381735504","https://openalex.org/W4382246105","https://openalex.org/W4385571886","https://openalex.org/W4386071707","https://openalex.org/W4386451579","https://openalex.org/W4388284731","https://openalex.org/W4390659326","https://openalex.org/W4390828922","https://openalex.org/W4400648761","https://openalex.org/W4401878796","https://openalex.org/W4406800520","https://openalex.org/W4407922851"],"related_works":[],"abstract_inverted_index":{"Edge":[0],"intelligence":[1,22,33,107],"in":[2,30,92,115,196],"space-air-ground":[3],"integrated":[4],"networks":[5],"(SAGINs)":[6],"can":[7,34,199],"enable":[8],"worldwide":[9],"network":[10,194],"coverage":[11,26],"beyond":[12],"geographical":[13],"limitations":[14],"for":[15,41,79,105,121,145,177],"users":[16,42],"to":[17,108,140,191],"access":[18],"ubiquitous":[19,112],"and":[20,27,90,102,111,128,138,154,168,208],"low-latency":[21],"services.":[23],"Facing":[24],"global":[25],"complex":[28,80],"environments":[29],"SAGINs,":[31],"edge":[32,44,106],"provision":[35,109],"large":[36],"language":[37],"models":[38],"(LLMs)":[39],"agents":[40,70,114],"via":[43],"servers":[45],"at":[46],"ground":[47],"base":[48],"stations":[49],"(BSs)":[50],"or":[51],"cloud":[52],"data":[53],"centers":[54],"relayed":[55],"by":[56,203],"satellites.":[57],"As":[58],"LLMs":[59,123],"with":[60,124,151],"billions":[61],"of":[62,159,166],"parameters":[63],"are":[64],"pretrained":[65],"on":[66],"vast":[67],"datasets,":[68],"LLM":[69,113,147],"have":[71],"few-shot":[72],"learning":[73],"capabilities,":[74],"e.g.,":[75],"chain-of-thought":[76],"(CoT)":[77],"prompting":[78,165],"tasks,":[81],"which":[82,198],"raises":[83],"a":[84,99,130,170,184],"new":[85],"trade-off":[86],"between":[87],"resource":[88],"consumption":[89],"performance":[91],"SAGINs.":[93,116],"In":[94],"this":[95],"paper,":[96],"we":[97],"propose":[98,129,169,183],"joint":[100,135],"caching":[101,137],"inference":[103],"framework":[104],"sustainable":[110],"We":[117,182],"introduce":[118],"\u201ccached":[119],"model-as-a-resource\u201d":[120],"offering":[122],"limited":[125],"context":[126],"windows":[127],"novel":[131],"optimization":[132],"framework,":[133],"i.e.,":[134],"model":[136,143,174],"inference,":[139],"utilize":[141],"cached":[142,173],"resources":[144],"provisioning":[146,180],"agent":[148],"services":[149],"along":[150],"communication,":[152],"computing,":[153],"storage":[155],"resources.We":[156],"design":[157],"\u201cage":[158],"thought\u201d":[160],"(AoT)":[161],"considering":[162],"the":[163,179],"CoT":[164],"LLMs,":[167],"least":[171],"AoT":[172],"replacement":[175],"algorithm":[176],"optimizing":[178],"cost.":[181],"deep":[185],"Q-network-based":[186],"modified":[187],"second-bid":[188],"(DQMSB)":[189],"auction":[190],"incentivize":[192],"satellite/ground":[193],"operators":[195],"real-time,":[197],"enhance":[200],"allocation":[201],"efficiency":[202],"23%":[204],"while":[205],"guaranteeing":[206],"strategy-proofness":[207],"being":[209],"free":[210],"from":[211],"adverse":[212],"selection.":[213]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2026-01-15T00:00:00"}
