% Roman Zajdel, "Epoch-incremental reinforcement learning algorithms",
% recorded as an online item issued by Uniwersytet Zielonogórski, Zielona Góra.
% The place of publication and the publisher name are stored in separate
% fields (address / publisher) so the bibliography style decides how to join them.
% NOTE(review): no year, url or venue is recorded here -- add them once confirmed.
% NOTE(review): type says "artykuł" (article); if the journal details are known,
% the article entry type would presumably fit better -- verify against the source.
% NOTE(review): values are UTF-8; a classic 8-bit BibTeX toolchain would need
% LaTeX accent escapes instead -- confirm the target toolchain.
@misc{Zajdel_Roman_Epoch-incremental,
  author       = {Zajdel, Roman},
  title        = {Epoch-incremental reinforcement learning algorithms},
  howpublished = {online},
  type         = {artykuł},
  address      = {Zielona Góra},
  publisher    = {Uniwersytet Zielonogórski},
  language     = {eng},
  keywords     = {reinforcement learning, epoch-incremental algorithm, grid world},
  abstract     = {In this article, a new class of the epoch-incremental reinforcement learning algorithm is proposed. In the incremental mode, the fundamental TD(0) or TD([lambda]) algorithm is performed and an environment model is created. In the epoch mode, on the basis of the environment model, the distances of past-active states to the terminal state are computed. These distances and the reinforcement terminal state signal are used to improve the agent policy.},
}