<!--
  Bibliographic metadata record for a single journal article: identifiers,
  authors, attached file relations, issue/volume/type/extent, language,
  publisher, source journal, rights, language-tagged subject keywords, title.

  NOTE(review): the default namespace http://purl.org/dc/elements/1.1/ is
  declared only on the first <identifier>; every other element here,
  including <Record> and the remaining <identifier> elements, is in no
  namespace. Confirm with consumers whether that is intended before moving
  the declaration, since doing so changes the qualified names of all elements.
-->
<Record>
  <identifier xmlns="http://purl.org/dc/elements/1.1/">URN:NBN:SI:DOC-1M7XGP5K</identifier>
  <date>2015</date>
  <creator>Šter, Branko</creator>
  <creator>Vodopivec, Tom</creator>
  <relation>documents/doc/1/URN_NBN_SI_doc-1M7XGP5K_001.pdf</relation>
  <relation>documents/doc/1/URN_NBN_SI_doc-1M7XGP5K_001.txt</relation>
  <format format_type="issue">3</format>
  <format format_type="volume">82</format>
  <format format_type="type">article</format>
  <format format_type="extent">str. 85-92</format>
  <identifier identifier_type="ISSN">0013-5852</identifier>
  <identifier identifier_type="COBISSID">1536426435</identifier>
  <identifier identifier_type="URN">URN:NBN:SI:doc-1M7XGP5K</identifier>
  <language>eng</language>
  <publisher>Elektrotehniška zveza Slovenije</publisher>
  <source>Elektrotehniški vestnik</source>
  <rights>InC</rights>
  <subject language_type_id="eng">decision problem</subject>
  <subject language_type_id="slv">krmiljenje Monte Carlo</subject>
  <subject language_type_id="slv">krmiljenje on-policy Monte Carlo</subject>
  <subject language_type_id="eng">Monte Carlo control</subject>
  <subject language_type_id="slv">odločitveni problem</subject>
  <subject language_type_id="eng">on-line learning</subject>
  <subject language_type_id="eng">on-policy Monte Carlo control</subject>
  <subject language_type_id="eng">reinforcement learning</subject>
  <subject language_type_id="slv">spodbujevalno učenje</subject>
  <subject language_type_id="slv">sprotno učenje</subject>
  <title>Forgetting early estimates in Monte Carlo control methods</title>
</Record>