{"id":"https://openalex.org/W4407949815","doi":"https://doi.org/10.1109/cdc56724.2024.10886519","title":"Generalized Maximum Entropy Differential Dynamic Programming","display_name":"Generalized Maximum Entropy Differential Dynamic Programming","publication_year":2024,"publication_date":"2024-12-16","ids":{"openalex":"https://openalex.org/W4407949815","doi":"https://doi.org/10.1109/cdc56724.2024.10886519"},"language":"en","primary_location":{"id":"doi:10.1109/cdc56724.2024.10886519","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cdc56724.2024.10886519","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE 63rd Conference on Decision and Control (CDC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5074025783","display_name":"Yuichiro Aoyama","orcid":"https://orcid.org/0000-0001-5676-3769"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yuichiro Aoyama","raw_affiliation_strings":["Georgia Institute of Technology,School of Aerospace Engineering,Atlanta,GA,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Georgia Institute of Technology,School of Aerospace Engineering,Atlanta,GA,USA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044505993","display_name":"Evangelos A. Theodorou","orcid":"https://orcid.org/0000-0002-0834-5738"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Evangelos A. Theodorou","raw_affiliation_strings":["Georgia Institute of Technology,School of Aerospace Engineering,Atlanta,GA,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Georgia Institute of Technology,School of Aerospace Engineering,Atlanta,GA,USA","institution_ids":["https://openalex.org/I130701444"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.3205,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.6648745,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"8825","last_page":"8831"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9761999845504761,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9761999845504761,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/principle-of-maximum-entropy","display_name":"Principle of maximum entropy","score":0.5867767333984375},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5654550194740295},{"id":"https://openalex.org/keywords/dynamic-programming","display_name":"Dynamic programming","score":0.5443735122680664},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.4289282262325287},{"id":"https://openalex.org/keywords/applied-mathematics","display_name":"Applied mathematics","score":0.3931722640991211},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.35965269804000854},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.30972468852996826},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.1556568145751953}],"concepts":[{"id":"https://openalex.org/C9679016","wikidata":"https://www.wikidata.org/wiki/Q1417473","display_name":"Principle of maximum entropy","level":2,"score":0.5867767333984375},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5654550194740295},{"id":"https://openalex.org/C37404715","wikidata":"https://www.wikidata.org/wiki/Q380679","display_name":"Dynamic programming","level":2,"score":0.5443735122680664},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.4289282262325287},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.3931722640991211},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.35965269804000854},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.30972468852996826},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.1556568145751953}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cdc56724.2024.10886519","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cdc56724.2024.10886519","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE 63rd Conference on Decision and Control (CDC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W1776349877","https://openalex.org/W1964988733","https://openalex.org/W1976627513","https://openalex.org/W1983874169","https://openalex.org/W1984474727","https://openalex.org/W1985892240","https://openalex.org/W1989818421","https://openalex.org/W1997414622","https://openalex.org/W2009387827","https://openalex.org/W2059374347","https://openalex.org/W2070887543","https://openalex.org/W2074466695","https://openalex.org/W2076037361","https://openalex.org/W2079061079","https://openalex.org/W2108631580","https://openalex.org/W3174208427","https://openalex.org/W3207783658","https://openalex.org/W4212797134","https://openalex.org/W6669051392","https://openalex.org/W6734517396","https://openalex.org/W6741565551","https://openalex.org/W6754404211","https://openalex.org/W6758491413","https://openalex.org/W6838650158","https://openalex.org/W6903351479"],"related_works":["https://openalex.org/W2051487156","https://openalex.org/W2073681303","https://openalex.org/W2053286651","https://openalex.org/W2181743346","https://openalex.org/W2187401768","https://openalex.org/W2181413294","https://openalex.org/W2052122378","https://openalex.org/W2544423928","https://openalex.org/W2062023542","https://openalex.org/W814774360"],"abstract_inverted_index":{"We":[0],"present":[1],"a":[2,23,35,103],"sampling-based":[3],"trajectory":[4,125],"optimization":[5],"method":[6,21],"derived":[7],"from":[8],"the":[9,26,45,48,51,64,71,75,81,85,93,121,124,139,142],"maximum":[10],"entropy":[11,89],"formulation":[12,95],"of":[13,25,53,74,84,123,141],"Differential":[14],"Dynamic":[15],"Programming":[16],"with":[17,29,59,87,96,102,131,135],"Tsallis":[18,46,88],"entropy.":[19],"This":[20,77],"is":[22,67,80,126],"generalization":[24],"legacy":[27],"work":[28],"Shannon":[30,97],"entropy,":[31,47,98],"which":[32,55,99],"leads":[33],"to":[34,70,92,108],"Gaussian":[36],"optimal":[37],"control":[38],"policy":[39,49],"for":[40],"exploration":[41,58,116],"during":[42],"optimization.":[43],"With":[44],"takes":[50],"form":[52],"q-Gaussian,":[54],"further":[56],"encourages":[57],"its":[60],"heavy-tailed":[61],"shape.":[62],"Moreover,":[63],"sampling":[65],"variance":[66,101],"scaled":[68],"according":[69],"value":[72],"function":[73],"trajectory.":[76],"scaling":[78],"mechanism":[79],"unique":[82],"property":[83],"algorithm":[86],"in":[90],"contrast":[91],"original":[94],"scales":[100],"fixed":[104],"temperature":[105],"parameter.":[106],"Due":[107],"this":[109],"property,":[110],"our":[111],"proposed":[112,143],"algorithms":[113],"can":[114],"promote":[115],"when":[117],"necessary,":[118],"that":[119],"is,":[120],"cost":[122,137],"high.":[127],"The":[128],"simulation":[129],"results":[130],"two":[132],"robotic":[133],"systems":[134],"multimodal":[136],"demonstrate":[138],"properties":[140],"algorithm.":[144]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
