{"id":"https://openalex.org/W2928077227","doi":"https://doi.org/10.1109/tvt.2019.2909055","title":"Buffer-Aware Streaming in Small-Scale Wireless Networks: A Deep Reinforcement Learning Approach","display_name":"Buffer-Aware Streaming in Small-Scale Wireless Networks: A Deep Reinforcement Learning Approach","publication_year":2019,"publication_date":"2019-04-03","ids":{"openalex":"https://openalex.org/W2928077227","doi":"https://doi.org/10.1109/tvt.2019.2909055","mag":"2928077227"},"language":"en","primary_location":{"id":"doi:10.1109/tvt.2019.2909055","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvt.2019.2909055","pdf_url":null,"source":{"id":"https://openalex.org/S10936095","display_name":"IEEE Transactions on Vehicular Technology","issn_l":"0018-9545","issn":["0018-9545","1939-9359"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Vehicular Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5077821665","display_name":"Yashuang Guo","orcid":"https://orcid.org/0000-0001-8870-9046"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yashuang Guo","raw_affiliation_strings":["School of Information and Electronics, Beijing Institute of Technology, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-8870-9046","affiliations":[{"raw_affiliation_string":"School of Information and Electronics, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100420016","display_name":"F. Richard Yu","orcid":"https://orcid.org/0000-0003-1006-7594"},"institutions":[{"id":"https://openalex.org/I67031392","display_name":"Carleton University","ror":"https://ror.org/02qtvee93","country_code":"CA","type":"education","lineage":["https://openalex.org/I67031392"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"F. Richard Yu","raw_affiliation_strings":["Department of Systems and Computer Engineering, Carleton University, Ottawa, ON, Canada"],"raw_orcid":"https://orcid.org/0000-0003-1006-7594","affiliations":[{"raw_affiliation_string":"Department of Systems and Computer Engineering, Carleton University, Ottawa, ON, Canada","institution_ids":["https://openalex.org/I67031392"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044674658","display_name":"Jianping An","orcid":"https://orcid.org/0000-0002-6441-9711"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianping An","raw_affiliation_strings":["School of Information and Electronics, Beijing Institute of Technology, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-6441-9711","affiliations":[{"raw_affiliation_string":"School of Information and Electronics, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006316216","display_name":"Kai Yang","orcid":"https://orcid.org/0000-0003-1059-0705"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kai Yang","raw_affiliation_strings":["School of Information and Electronics, Beijing Institute of Technology, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-1059-0705","affiliations":[{"raw_affiliation_string":"School of Information and Electronics, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100693513","display_name":"Ying He","orcid":"https://orcid.org/0000-0002-7079-8682"},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ying He","raw_affiliation_strings":["School of Information and Communications Engineering, Dalian University of Technology, Dalian, China"],"raw_orcid":"https://orcid.org/0000-0002-7079-8682","affiliations":[{"raw_affiliation_string":"School of Information and Communications Engineering, Dalian University of Technology, Dalian, China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5035919267","display_name":"Victor C. M. Leung","orcid":"https://orcid.org/0000-0003-3529-2640"},"institutions":[{"id":"https://openalex.org/I141945490","display_name":"University of British Columbia","ror":"https://ror.org/03rmrcq20","country_code":"CA","type":"education","lineage":["https://openalex.org/I141945490"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Victor C. M. Leung","raw_affiliation_strings":["Department of Electrical and Computer Engineering, The University of British Columbia, Vancouver, BC, Canada"],"raw_orcid":"https://orcid.org/0000-0003-3529-2640","affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, The University of British Columbia, Vancouver, BC, Canada","institution_ids":["https://openalex.org/I141945490"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.3388,"has_fulltext":false,"cited_by_count":32,"citation_normalized_percentile":{"value":0.91024611,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"68","issue":"7","first_page":"6891","last_page":"6902"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11165","display_name":"Image and Video Quality Assessment","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11409","display_name":"Advanced Wireless Network Optimization","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8036705255508423},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7491195201873779},{"id":"https://openalex.org/keywords/wireless-network","display_name":"Wireless network","score":0.6236810684204102},{"id":"https://openalex.org/keywords/wireless","display_name":"Wireless","score":0.5329628586769104},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.5132872462272644},{"id":"https://openalex.org/keywords/arithmetic-underflow","display_name":"Arithmetic underflow","score":0.4959186017513275},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.4934498369693756},{"id":"https://openalex.org/keywords/real-time-computing","display_name":"Real-time computing","score":0.4852488040924072},{"id":"https://openalex.org/keywords/channel-allocation-schemes","display_name":"Channel allocation schemes","score":0.4508679211139679},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.3555777668952942},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.274223268032074},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.23191750049591064}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8036705255508423},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7491195201873779},{"id":"https://openalex.org/C108037233","wikidata":"https://www.wikidata.org/wiki/Q11375","display_name":"Wireless network","level":3,"score":0.6236810684204102},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.5329628586769104},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.5132872462272644},{"id":"https://openalex.org/C3265923","wikidata":"https://www.wikidata.org/wiki/Q669129","display_name":"Arithmetic underflow","level":2,"score":0.4959186017513275},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.4934498369693756},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.4852488040924072},{"id":"https://openalex.org/C114237682","wikidata":"https://www.wikidata.org/wiki/Q5072483","display_name":"Channel allocation schemes","level":3,"score":0.4508679211139679},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.3555777668952942},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.274223268032074},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.23191750049591064},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tvt.2019.2909055","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tvt.2019.2909055","pdf_url":null,"source":{"id":"https://openalex.org/S10936095","display_name":"IEEE Transactions on Vehicular Technology","issn_l":"0018-9545","issn":["0018-9545","1939-9359"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Vehicular Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G111310164","display_name":"\u8d85\u5bc6\u5ea6\u8702\u7a9d\u7f51\u7edc\u5efa\u6a21\u5206\u6790\u4e0e\u8d44\u6e90\u5206\u914d\u6280\u672f\u7814\u7a76","funder_award_id":"61771054","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G732504972","display_name":null,"funder_award_id":"2018M640079","funder_id":"https://openalex.org/F4320321543","funder_display_name":"China Postdoctoral Science Foundation"},{"id":"https://openalex.org/G8350575903","display_name":null,"funder_award_id":"61801025","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321543","display_name":"China Postdoctoral Science Foundation","ror":"https://ror.org/0426zh255"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":48,"referenced_works":["https://openalex.org/W595252221","https://openalex.org/W1522301498","https://openalex.org/W1658008008","https://openalex.org/W1664636959","https://openalex.org/W1976944900","https://openalex.org/W2016980626","https://openalex.org/W2021765723","https://openalex.org/W2046063575","https://openalex.org/W2050316560","https://openalex.org/W2051147690","https://openalex.org/W2098046554","https://openalex.org/W2098432798","https://openalex.org/W2118441052","https://openalex.org/W2119683335","https://openalex.org/W2121863487","https://openalex.org/W2129816625","https://openalex.org/W2134240434","https://openalex.org/W2134618125","https://openalex.org/W2141234504","https://openalex.org/W2145339207","https://openalex.org/W2155027007","https://openalex.org/W2164599584","https://openalex.org/W2173248099","https://openalex.org/W2192203593","https://openalex.org/W2344749673","https://openalex.org/W2409027520","https://openalex.org/W2609654676","https://openalex.org/W2734506266","https://openalex.org/W2744401049","https://openalex.org/W2744628735","https://openalex.org/W2744786564","https://openalex.org/W2756144809","https://openalex.org/W2791797404","https://openalex.org/W2794237953","https://openalex.org/W2903151719","https://openalex.org/W2962836907","https://openalex.org/W2963262099","https://openalex.org/W2963864421","https://openalex.org/W2964043796","https://openalex.org/W2964121744","https://openalex.org/W4214717370","https://openalex.org/W4214839495","https://openalex.org/W6631190155","https://openalex.org/W6636881020","https://openalex.org/W6683204974","https://openalex.org/W6692846177","https://openalex.org/W6703271639","https://openalex.org/W7066500546"],"related_works":["https://openalex.org/W4385483253","https://openalex.org/W2909591731","https://openalex.org/W2756144809","https://openalex.org/W2725080322","https://openalex.org/W2742128636","https://openalex.org/W4285093550","https://openalex.org/W2248892642","https://openalex.org/W2904617116","https://openalex.org/W4285101270","https://openalex.org/W2107557358"],"abstract_inverted_index":{"Buffer-aware":[0],"video":[1,16,22,45,59,63,84,101,108,118,123,155,205],"streaming,":[2],"which":[3],"exploits":[4],"the":[5,14,33,37,54,77,89,121,144,153,186,195],"available":[6],"storage":[7],"space":[8],"in":[9,18,25,48,189,207],"user":[10,68],"device":[11],"to":[12,31,35,53,66,79,94],"store":[13],"prefetched":[15],"data":[17,23],"good":[19],"channels":[20,42],"for":[21,98,116,151,203],"use":[24],"poor":[26],"channels,":[27],"has":[28],"been":[29],"proved":[30],"have":[32],"potential":[34],"reduce":[36],"impact":[38],"of":[39,143,158],"fluctuating":[40],"wireless":[41,50,67,83,99,208],"on":[43,178],"user-perceived":[44],"performance.":[46],"However,":[47],"practical":[49],"networks,":[51],"due":[52],"unknown":[55,104],"channel":[56,105],"state":[57,106],"and":[58,107,148,165],"rate,":[60],"providing":[61],"buffer-aware":[62,100,117,204],"streaming":[64,85,102,119,124,156,206],"service":[65],"is":[69,169,201],"a":[70,113,136,173,179],"challenging":[71],"problem.":[72],"In":[73],"this":[74],"paper,":[75],"with":[76],"aim":[78],"design":[80],"an":[81],"autonomous":[82],"system,":[86],"we":[87,111],"apply":[88],"deep":[90,174,180,197],"reinforcement":[91,181,198],"learning":[92,182,199],"approach":[93,200],"dynamic":[95],"resource":[96],"optimization":[97],"under":[103],"rate.":[109],"Specifically,":[110],"define":[112],"reward":[114],"function":[115],"as":[120],"effective":[122,154,202],"time":[125,157],"when":[126],"neither":[127],"video-playback":[128,131],"overflow":[129],"nor":[130],"underflow":[132],"occurs.":[133],"We":[134,184],"propose":[135],"Markov":[137],"decision":[138],"process":[139],"based":[140,177],"problem":[141],"formulation":[142],"joint":[145],"bandwidth":[146,163],"allocation":[147,164],"buffer":[149,166],"management":[150,167],"maximizing":[152],"all":[159],"users.":[160],"The":[161],"optimal":[162],"policy":[168],"learned":[170],"from":[171],"training":[172],"neural":[175],"network":[176],"algorithm.":[183],"simulate":[185],"proposed":[187,196],"algorithm":[188],"Tensorflow.":[190],"Simulation":[191],"results":[192],"verify":[193],"that":[194],"networks.":[209]},"counts_by_year":[{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":9},{"year":2020,"cited_by_count":9},{"year":2019,"cited_by_count":3}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
