{"id":"https:\/\/openalex.org\/W4391669357","doi":"https:\/\/doi.org\/10.1016\/j.automatica.2024.111557","title":"Anderson acceleration for partially observable Markov decision processes: A maximum entropy approach","display_name":"Anderson acceleration for partially observable Markov decision processes: A maximum entropy approach","publication_year":2024,"publication_date":"2024-02-08","ids":{"openalex":"https:\/\/openalex.org\/W4391669357","doi":"https:\/\/doi.org\/10.1016\/j.automatica.2024.111557"},"language":"en","primary_location":{"id":"doi:10.1016\/j.automatica.2024.111557","is_oa":false,"landing_page_url":"https:\/\/doi.org\/10.1016\/j.automatica.2024.111557","pdf_url":null,"source":{"id":"https:\/\/openalex.org\/S51360982","display_name":"Automatica","issn_l":"0005-1098","issn":["0005-1098","1873-2836"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https:\/\/openalex.org\/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https:\/\/openalex.org\/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Automatica","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https:\/\/openalex.org\/A5070897184","display_name":"Mingyu Park","orcid":"https:\/\/orcid.org\/0000-0003-3003-2065"},"institutions":[{"id":"https:\/\/openalex.org\/I139264467","display_name":"Seoul National University","ror":"https:\/\/ror.org\/04h9pn542","country_code":"KR","type":"education","lineage":["https:\/\/openalex.org\/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Mingyu Park","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Automation and Systems Research Institute, Seoul National University, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Automation and Systems Research Institute, Seoul National University, Republic of Korea","institution_ids":["https:\/\/openalex.org\/I139264467"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jaeuk Shin","orcid":null},"institutions":[{"id":"https:\/\/openalex.org\/I139264467","display_name":"Seoul National University","ror":"https:\/\/ror.org\/04h9pn542","country_code":"KR","type":"education","lineage":["https:\/\/openalex.org\/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jaeuk Shin","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Automation and Systems Research Institute, Seoul National University, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Automation and Systems Research Institute, Seoul National University, Republic of Korea","institution_ids":["https:\/\/openalex.org\/I139264467"]}]},{"author_position":"last","author":{"id":"https:\/\/openalex.org\/A5063507594","display_name":"Insoon Yang","orcid":"https:\/\/orcid.org\/0000-0001-5887-6169"},"institutions":[{"id":"https:\/\/openalex.org\/I139264467","display_name":"Seoul National University","ror":"https:\/\/ror.org\/04h9pn542","country_code":"KR","type":"education","lineage":["https:\/\/openalex.org\/I139264467"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Insoon Yang","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Automation and Systems Research Institute, Seoul National University, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Automation and Systems Research Institute, Seoul National University, Republic of Korea","institution_ids":["https:\/\/openalex.org\/I139264467"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https:\/\/openalex.org\/A5063507594"],"corresponding_institution_ids":["https:\/\/openalex.org\/I139264467"],"apc_list":{"value":3500,"currency":"USD","value_usd":3500},"apc_paid":null,"fwci":1.0034,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.78205043,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"163","issue":null,"first_page":"111557","last_page":"111557"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https:\/\/openalex.org\/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9988999962806702,"subfield":{"id":"https:\/\/openalex.org\/subfields\/1702","display_name":"Artificial Intelligence"},"field":{"id":"https:\/\/openalex.org\/fields\/17","display_name":"Computer Science"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}},"topics":[{"id":"https:\/\/openalex.org\/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9988999962806702,"subfield":{"id":"https:\/\/openalex.org\/subfields\/1702","display_name":"Artificial Intelligence"},"field":{"id":"https:\/\/openalex.org\/fields\/17","display_name":"Computer Science"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}},{"id":"https:\/\/openalex.org\/T10791","display_name":"Advanced Control Systems Optimization","score":0.9987999796867371,"subfield":{"id":"https:\/\/openalex.org\/subfields\/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https:\/\/openalex.org\/fields\/22","display_name":"Engineering"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}},{"id":"https:\/\/openalex.org\/T10876","display_name":"Fault Detection and Control Systems","score":0.9977999925613403,"subfield":{"id":"https:\/\/openalex.org\/subfields\/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https:\/\/openalex.org\/fields\/22","display_name":"Engineering"},"domain":{"id":"https:\/\/openalex.org\/domains\/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https:\/\/openalex.org\/keywords\/partially-observable-markov-decision-process","display_name":"Partially observable Markov decision process","score":0.7321454286575317},{"id":"https:\/\/openalex.org\/keywords\/markov-decision-process","display_name":"Markov decision process","score":0.667229413986206},{"id":"https:\/\/openalex.org\/keywords\/mathematical-optimization","display_name":"Mathematical optimization","score":0.6154382228851318},{"id":"https:\/\/openalex.org\/keywords\/scalability","display_name":"Scalability","score":0.6011749505996704},{"id":"https:\/\/openalex.org\/keywords\/computer-science","display_name":"Computer science","score":0.5944204330444336},{"id":"https:\/\/openalex.org\/keywords\/benchmark","display_name":"Benchmark (surveying)","score":0.5287589430809021},{"id":"https:\/\/openalex.org\/keywords\/observable","display_name":"Observable","score":0.5190504193305969},{"id":"https:\/\/openalex.org\/keywords\/markov-process","display_name":"Markov process","score":0.45191437005996704},{"id":"https:\/\/openalex.org\/keywords\/entropy","display_name":"Entropy (arrow of time)","score":0.44877541065216064},{"id":"https:\/\/openalex.org\/keywords\/algorithm","display_name":"Algorithm","score":0.443978488445282},{"id":"https:\/\/openalex.org\/keywords\/principle-of-maximum-entropy","display_name":"Principle of maximum entropy","score":0.4209808111190796},{"id":"https:\/\/openalex.org\/keywords\/mathematics","display_name":"Mathematics","score":0.3136812746524811},{"id":"https:\/\/openalex.org\/keywords\/artificial-intelligence","display_name":"Artificial intelligence","score":0.18246719241142273}],"concepts":[{"id":"https:\/\/openalex.org\/C17098449","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q176814","display_name":"Partially observable Markov decision process","level":4,"score":0.7321454286575317},{"id":"https:\/\/openalex.org\/C106189395","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q176789","display_name":"Markov decision process","level":3,"score":0.667229413986206},{"id":"https:\/\/openalex.org\/C126255220","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q141495","display_name":"Mathematical optimization","level":1,"score":0.6154382228851318},{"id":"https:\/\/openalex.org\/C48044578","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q727490","display_name":"Scalability","level":2,"score":0.6011749505996704},{"id":"https:\/\/openalex.org\/C41008148","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q21198","display_name":"Computer science","level":0,"score":0.5944204330444336},{"id":"https:\/\/openalex.org\/C185798385","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5287589430809021},{"id":"https:\/\/openalex.org\/C32848918","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q845789","display_name":"Observable","level":2,"score":0.5190504193305969},{"id":"https:\/\/openalex.org\/C159886148","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q176645","display_name":"Markov process","level":2,"score":0.45191437005996704},{"id":"https:\/\/openalex.org\/C106301342","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.44877541065216064},{"id":"https:\/\/openalex.org\/C11413529","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q8366","display_name":"Algorithm","level":1,"score":0.443978488445282},{"id":"https:\/\/openalex.org\/C9679016","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q1417473","display_name":"Principle of maximum entropy","level":2,"score":0.4209808111190796},{"id":"https:\/\/openalex.org\/C33923547","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q395","display_name":"Mathematics","level":0,"score":0.3136812746524811},{"id":"https:\/\/openalex.org\/C154945302","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q11660","display_name":"Artificial intelligence","level":1,"score":0.18246719241142273},{"id":"https:\/\/openalex.org\/C121332964","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q413","display_name":"Physics","level":0,"score":0},{"id":"https:\/\/openalex.org\/C62520636","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q944","display_name":"Quantum mechanics","level":1,"score":0},{"id":"https:\/\/openalex.org\/C105795698","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q12483","display_name":"Statistics","level":1,"score":0},{"id":"https:\/\/openalex.org\/C13280743","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q131089","display_name":"Geodesy","level":1,"score":0},{"id":"https:\/\/openalex.org\/C77088390","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q8513","display_name":"Database","level":1,"score":0},{"id":"https:\/\/openalex.org\/C205649164","wikidata":"https:\/\/www.wikidata.org\/wiki\/Q1071","display_name":"Geography","level":0,"score":0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1016\/j.automatica.2024.111557","is_oa":false,"landing_page_url":"https:\/\/doi.org\/10.1016\/j.automatica.2024.111557","pdf_url":null,"source":{"id":"https:\/\/openalex.org\/S51360982","display_name":"Automatica","issn_l":"0005-1098","issn":["0005-1098","1873-2836"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https:\/\/openalex.org\/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https:\/\/openalex.org\/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Automatica","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https:\/\/metadata.un.org\/sdg\/16","score":0.7900000214576721}],"awards":[],"funders":[{"id":"https:\/\/openalex.org\/F4320322120","display_name":"National Research Foundation of Korea","ror":"https:\/\/ror.org\/013aysd81"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":55,"referenced_works":["https:\/\/openalex.org\/W1491973539","https:\/\/openalex.org\/W1515891729","https:\/\/openalex.org\/W1532688806","https:\/\/openalex.org\/W1539216098","https:\/\/openalex.org\/W1563317173","https:\/\/openalex.org\/W1605929701","https:\/\/openalex.org\/W1966801132","https:\/\/openalex.org\/W2011418219","https:\/\/openalex.org\/W2034725503","https:\/\/openalex.org\/W2038281434","https:\/\/openalex.org\/W2055921164","https:\/\/openalex.org\/W2071486596","https:\/\/openalex.org\/W2099430963","https:\/\/openalex.org\/W2100514507","https:\/\/openalex.org\/W2119567691","https:\/\/openalex.org\/W2158907787","https:\/\/openalex.org\/W2164819104","https:\/\/openalex.org\/W2169294731","https:\/\/openalex.org\/W2529804031","https:\/\/openalex.org\/W2545546008","https:\/\/openalex.org\/W2593952959","https:\/\/openalex.org\/W2594103415","https:\/\/openalex.org\/W2781726626","https:\/\/openalex.org\/W2946258294","https:\/\/openalex.org\/W2952258289","https:\/\/openalex.org\/W2962938426","https:\/\/openalex.org\/W2970692013","https:\/\/openalex.org\/W2970981858","https:\/\/openalex.org\/W3005380052","https:\/\/openalex.org\/W3007299075","https:\/\/openalex.org\/W3009835149","https:\/\/openalex.org\/W3041718411","https:\/\/openalex.org\/W3098184036","https:\/\/openalex.org\/W3100586730","https:\/\/openalex.org\/W3110347183","https:\/\/openalex.org\/W3120149500","https:\/\/openalex.org\/W3120161765","https:\/\/openalex.org\/W3162263071","https:\/\/openalex.org\/W3196212238","https:\/\/openalex.org\/W3202312176","https:\/\/openalex.org\/W3205338158","https:\/\/openalex.org\/W4226145367","https:\/\/openalex.org\/W4226471227","https:\/\/openalex.org\/W4255064568","https:\/\/openalex.org\/W4285445987","https:\/\/openalex.org\/W4287206514","https:\/\/openalex.org\/W4287765634","https:\/\/openalex.org\/W4297814233","https:\/\/openalex.org\/W4307347247","https:\/\/openalex.org\/W4310419966","https:\/\/openalex.org\/W6684973485","https:\/\/openalex.org\/W6717999219","https:\/\/openalex.org\/W6759637383","https:\/\/openalex.org\/W6762537981","https:\/\/openalex.org\/W6795323799"],"related_works":["https:\/\/openalex.org\/W2999848267","https:\/\/openalex.org\/W2096013579","https:\/\/openalex.org\/W52153049","https:\/\/openalex.org\/W1760611253","https:\/\/openalex.org\/W1515117609","https:\/\/openalex.org\/W1589140671","https:\/\/openalex.org\/W4323315247","https:\/\/openalex.org\/W131709709","https:\/\/openalex.org\/W2294884454","https:\/\/openalex.org\/W3169161914"],"abstract_inverted_index":null,"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}