{"id":"https://openalex.org/W2588722917","doi":"https://doi.org/10.1109/ssci.2016.7849833","title":"Policy graph pruning and optimization in Monte Carlo Value Iteration for continuous-state POMDPs","display_name":"Policy graph pruning and optimization in Monte Carlo Value Iteration for continuous-state POMDPs","publication_year":2016,"publication_date":"2016-12-01","ids":{"openalex":"https://openalex.org/W2588722917","doi":"https://doi.org/10.1109/ssci.2016.7849833","mag":"2588722917"},"language":"en","primary_location":{"id":"doi:10.1109/ssci.2016.7849833","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ssci.2016.7849833","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE Symposium Series on Computational Intelligence (SSCI)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075495276","display_name":"Weisheng Qian","orcid":null},"institutions":[{"id":"https://openalex.org/I3923682","display_name":"Soochow University","ror":"https://ror.org/05t8y2r12","country_code":"CN","type":"education","lineage":["https://openalex.org/I3923682"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Weisheng Qian","raw_affiliation_strings":["School of Computer Science and Technology, Soochow University, Suzhou, P.R. China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Soochow University, Suzhou, P.R. China","institution_ids":["https://openalex.org/I3923682"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072120380","display_name":"Quan Liu","orcid":"https://orcid.org/0000-0001-9377-2816"},"institutions":[{"id":"https://openalex.org/I3923682","display_name":"Soochow University","ror":"https://ror.org/05t8y2r12","country_code":"CN","type":"education","lineage":["https://openalex.org/I3923682"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Quan Liu","raw_affiliation_strings":["School of Computer Science and Technology, Soochow University, Suzhou, P.R. China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Soochow University, Suzhou, P.R. China","institution_ids":["https://openalex.org/I3923682"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035138959","display_name":"Zongzhang Zhang","orcid":"https://orcid.org/0000-0002-9238-4747"},"institutions":[{"id":"https://openalex.org/I3923682","display_name":"Soochow University","ror":"https://ror.org/05t8y2r12","country_code":"CN","type":"education","lineage":["https://openalex.org/I3923682"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zongzhang Zhang","raw_affiliation_strings":["School of Computer Science and Technology, Soochow University, Suzhou, P.R. China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Soochow University, Suzhou, P.R. China","institution_ids":["https://openalex.org/I3923682"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021091060","display_name":"Zhiyuan Pan","orcid":"https://orcid.org/0000-0001-6035-1070"},"institutions":[{"id":"https://openalex.org/I3923682","display_name":"Soochow University","ror":"https://ror.org/05t8y2r12","country_code":"CN","type":"education","lineage":["https://openalex.org/I3923682"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiyuan Pan","raw_affiliation_strings":["School of Computer Science and Technology, Soochow University, Suzhou, P.R. China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Soochow University, Suzhou, P.R. China","institution_ids":["https://openalex.org/I3923682"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101902909","display_name":"Shan Zhong","orcid":"https://orcid.org/0000-0003-0034-6952"},"institutions":[{"id":"https://openalex.org/I3923682","display_name":"Soochow University","ror":"https://ror.org/05t8y2r12","country_code":"CN","type":"education","lineage":["https://openalex.org/I3923682"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shan Zhong","raw_affiliation_strings":["School of Computer Science and Technology, Soochow University, Suzhou, P.R. China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Soochow University, Suzhou, P.R. China","institution_ids":["https://openalex.org/I3923682"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5075495276"],"corresponding_institution_ids":["https://openalex.org/I3923682"],"apc_list":null,"apc_paid":null,"fwci":0.334,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.69021766,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10444","display_name":"Context-Aware Activity Recognition Systems","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10444","display_name":"Context-Aware Activity Recognition Systems","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13553","display_name":"Age of Information Optimization","score":0.9869999885559082,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7859330773353577},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.6333985328674316},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.6225332617759705},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.6145035624504089},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.5236011743545532},{"id":"https://openalex.org/keywords/node","display_name":"Node (physics)","score":0.4727550148963928},{"id":"https://openalex.org/keywords/monte-carlo-tree-search","display_name":"Monte Carlo tree search","score":0.4508993327617645},{"id":"https://openalex.org/keywords/bellman-equation","display_name":"Bellman equation","score":0.44118013978004456},{"id":"https://openalex.org/keywords/monte-carlo-method","display_name":"Monte Carlo method","score":0.3746264576911926},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.2965565621852875},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1710834801197052}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7859330773353577},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.6333985328674316},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.6225332617759705},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.6145035624504089},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.5236011743545532},{"id":"https://openalex.org/C62611344","wikidata":"https://www.wikidata.org/wiki/Q1062658","display_name":"Node (physics)","level":2,"score":0.4727550148963928},{"id":"https://openalex.org/C46149586","wikidata":"https://www.wikidata.org/wiki/Q11785332","display_name":"Monte Carlo tree search","level":3,"score":0.4508993327617645},{"id":"https://openalex.org/C14646407","wikidata":"https://www.wikidata.org/wiki/Q1430750","display_name":"Bellman equation","level":2,"score":0.44118013978004456},{"id":"https://openalex.org/C19499675","wikidata":"https://www.wikidata.org/wiki/Q232207","display_name":"Monte Carlo method","level":2,"score":0.3746264576911926},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.2965565621852875},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1710834801197052},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ssci.2016.7849833","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ssci.2016.7849833","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE Symposium Series on Computational Intelligence (SSCI)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7400000095367432,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":46,"referenced_works":["https://openalex.org/W2214249","https://openalex.org/W123090642","https://openalex.org/W130797843","https://openalex.org/W135762054","https://openalex.org/W206203849","https://openalex.org/W1532688806","https://openalex.org/W1605929701","https://openalex.org/W1679945064","https://openalex.org/W1967850904","https://openalex.org/W1978322215","https://openalex.org/W2025217226","https://openalex.org/W2038475577","https://openalex.org/W2047990226","https://openalex.org/W2055921164","https://openalex.org/W2099430963","https://openalex.org/W2101421095","https://openalex.org/W2109393574","https://openalex.org/W2110962519","https://openalex.org/W2116753650","https://openalex.org/W2118656144","https://openalex.org/W2124595631","https://openalex.org/W2144088174","https://openalex.org/W2144283793","https://openalex.org/W2156950870","https://openalex.org/W2162428884","https://openalex.org/W2168359464","https://openalex.org/W2171084228","https://openalex.org/W2205289028","https://openalex.org/W2287282975","https://openalex.org/W2294100503","https://openalex.org/W2295605012","https://openalex.org/W2438667436","https://openalex.org/W2542673510","https://openalex.org/W2963889160","https://openalex.org/W6604974139","https://openalex.org/W6605405389","https://openalex.org/W6605525015","https://openalex.org/W6608353451","https://openalex.org/W6631864160","https://openalex.org/W6636732284","https://openalex.org/W6676216739","https://openalex.org/W6678541622","https://openalex.org/W6681633084","https://openalex.org/W6681718981","https://openalex.org/W6683336107","https://openalex.org/W6684973485"],"related_works":["https://openalex.org/W2152670157","https://openalex.org/W2386410636","https://openalex.org/W176737593","https://openalex.org/W2808418668","https://openalex.org/W2903299703","https://openalex.org/W2156021013","https://openalex.org/W2016648086","https://openalex.org/W3105579180","https://openalex.org/W4399157305","https://openalex.org/W4281791088"],"abstract_inverted_index":{"Nowadays,":[0],"Partially":[1],"Observation":[2],"Markov":[3],"Decision":[4],"Processes":[5],"(POMDPs)":[6],"provide":[7],"a":[8,38,50,113,118],"principled":[9],"mathematical":[10],"framework":[11],"for":[12,80,184],"solving":[13],"some":[14],"realistic":[15],"problems":[16,31],"with":[17,32,83,190],"continuous":[18,33],"spaces.":[19,35],"The":[20],"recently":[21],"introduced":[22],"Monte":[23],"Carlo":[24],"Value":[25],"Iteration":[26],"(MCVI)":[27],"can":[28],"tackle":[29],"such":[30,86],"state":[34],"It":[36],"uses":[37],"policy":[39,101,114,125,164,188],"graph":[40,60,102,115],"implicitly":[41],"to":[42,71,96],"represent":[43],"the":[44,56,73,81,100,109,124,130,139,147,157,171],"value":[45,131],"function,":[46],"instead":[47],"of":[48,52,58,112,132],"using":[49],"set":[51],"\u03b1-functions":[53],"explicitly.":[54],"However,":[55],"size":[57],"its":[59],"would":[61],"grow":[62],"over":[63],"time":[64],"and":[65,98,137,173,179],"it":[66,77],"doesn't":[67],"take":[68],"any":[69,162],"measure":[70],"optimize":[72,99,108],"graph.":[74,126,165],"This":[75,90],"makes":[76],"not":[78,154],"applicable":[79],"devices":[82],"limited":[84],"resources":[85],"as":[87],"wearable":[88],"watches.":[89],"paper":[91],"introduces":[92],"three":[93],"novel":[94],"techniques":[95],"prune":[97,138,146],"obtained":[103],"by":[104,142],"MCVI.":[105],"First,":[106],"we":[107,128,145],"internal":[110],"structure":[111],"G":[116,136],"whenever":[117],"new":[119],"node":[120,134,160],"is":[121],"added":[122],"into":[123],"Second,":[127],"evaluate":[129],"each":[133],"in":[135,161],"nodes":[140],"dominated":[141],"others.":[143],"Third,":[144],"redundant":[148],"nodes,":[149],"meaning":[150],"that":[151],"they":[152],"are":[153,182],"reachable":[155],"from":[156],"initial":[158],"action":[159],"optimal":[163],"Empirical":[166],"results":[167],"show":[168],"that,":[169],"on":[170],"corridor":[172],"musical":[174],"chairs":[175],"problems,":[176],"our":[177],"pruning":[178],"optimization":[180],"methods":[181],"useful":[183],"constructing":[185],"more":[186],"compact":[187],"graphs":[189],"comparable":[191],"qualities.":[192]},"counts_by_year":[{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
