<?xml version="1.0" encoding="utf-8"?>
<?xml-stylesheet type="text/xsl" href="style/detail_T.xsl"?>
<bibitem type="J">   <ARLID>0399560</ARLID> <utime>20240903170627.7</utime><mtime>20131203235959.9</mtime>   <SCOPUS>84889006605</SCOPUS> <WOS>000328665200004</WOS>         <title language="eng" primary="1">Approximate Dynamic Programming Based on High Dimensional Model Representation</title>  <specification> <page_count>18 s.</page_count> <media_type>P</media_type> </specification>    <serial><ARLID>cav_un_epca*0297163</ARLID><ISSN>0023-5954</ISSN><title>Kybernetika</title><part_num/><part_title/><volume_id>49</volume_id><volume>5 (2013)</volume><page_num>720-737</page_num><publisher><place/><name>Ústav teorie informace a automatizace AV ČR, v. v. i.</name><year/></publisher></serial>    <keyword>approximate dynamic programming</keyword>   <keyword>Bellman equation</keyword>   <keyword>approximate HDMR minimization</keyword>   <keyword>trust region problem</keyword>    <author primary="1"> <ARLID>cav_un_auth*0234872</ARLID> <full_dept language="cz">Matematická teorie rozhodování</full_dept> <full_dept language="eng">Department of Decision Making Theory</full_dept> <department language="cz">MTR</department> <department language="eng">MTR</department> <full_dept>Department of Decision Making Theory</full_dept>  <name1>Pištěk</name1> <name2>Miroslav</name2> <institution>UTIA-B</institution> <fullinstit>Ústav teorie informace a automatizace AV ČR, v. v. i.</fullinstit> </author>   <source> <url>http://library.utia.cas.cz/separaty/2013/AS/pistek-0399560.pdf</url> </source>        <cas_special> <project> <ARLID>cav_un_auth*0273082</ARLID> <project_id>GAP102/11/0437</project_id> <agency>GA ČR</agency> <country>CZ</country> </project>  <abstract language="eng" primary="1">This article introduces an algorithm for implicit High Dimensional Model Representation  (HDMR) of the Bellman equation. This approximation technique reduces memory demands  of the algorithm considerably. Moreover, we show that HDMR enables fast approximate min-  imization which is essential for evaluation of the Bellman function. In each time step, the  problem of parametrized HDMR minimization is relaxed into trust region problems, all sharing  the same matrix. Finding its eigenvalue decomposition, we effectively achieve estimates of all  minima. Their full-domain representation is avoided by HDMR and then the same approach  is used recursively in the next time step. An illustrative example of N-armed bandit problem  is included. We assume that the newly established connection between approximate HDMR  minimization and the trust region problem can be beneficial also to many other applications.</abstract>     <RIV>BC</RIV>    <reportyear>2014</reportyear>     <unknown tag="mrcbC52"> 4 O 4o 20231122135935.5 </unknown> <inst_support> RVO:67985556 </inst_support>  <permalink>http://hdl.handle.net/11104/0226953</permalink>          <unknown tag="mrcbT16-e">COMPUTERSCIENCECYBERNETICS</unknown> <unknown tag="mrcbT16-f">0.577</unknown> <unknown tag="mrcbT16-g">0.098</unknown> <unknown tag="mrcbT16-h">9.IV</unknown> <unknown tag="mrcbT16-i">0.00191</unknown> <unknown tag="mrcbT16-j">0.341</unknown> <unknown tag="mrcbT16-k">655</unknown> <unknown tag="mrcbT16-l">61</unknown> <unknown tag="mrcbT16-s">0.348</unknown> <unknown tag="mrcbT16-z">ScienceCitationIndexExpanded</unknown> <unknown tag="mrcbT16-4">Q2</unknown> <unknown tag="mrcbT16-B">35.159</unknown> <unknown tag="mrcbT16-C">31.250</unknown> <unknown tag="mrcbT16-D">Q3</unknown> <unknown tag="mrcbT16-E">Q3</unknown> <arlyear>2013</arlyear>    <unknown tag="mrcbTft">  Soubory v repozitáři: pistek-0399560.pdf </unknown>    <unknown tag="mrcbU14"> 84889006605 SCOPUS </unknown> <unknown tag="mrcbU34"> 000328665200004 WOS </unknown> <unknown tag="mrcbU63"> cav_un_epca*0297163 Kybernetika 0023-5954 Roč. 49 č. 5 2013 720 737 Ústav teorie informace a automatizace AV ČR, v. v. i. </unknown> </cas_special> </bibitem>