From 0915fdd7999d629ec5325985b755a389a46af122 Mon Sep 17 00:00:00 2001 From: justheuristic Date: Mon, 17 Jun 2019 19:20:08 +0300 Subject: [PATCH] fix docstring: session rewards are aggregated --- week01_intro/crossentropy_method.ipynb | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/week01_intro/crossentropy_method.ipynb b/week01_intro/crossentropy_method.ipynb index a80cb7382..031b7e6e7 100644 --- a/week01_intro/crossentropy_method.ipynb +++ b/week01_intro/crossentropy_method.ipynb @@ -178,7 +178,7 @@ " Select states and actions from games that have rewards >= percentile\n", " :param states_batch: list of lists of states, states_batch[session_i][t]\n", " :param actions_batch: list of lists of actions, actions_batch[session_i][t]\n", - " :param rewards_batch: list of rewards, rewards_batch[session_i][t]\n", + " :param rewards_batch: list of rewards, rewards_batch[session_i]\n", "\n", " :returns: elite_states,elite_actions, both 1D lists of states and respective actions from elite sessions\n", "\n",