From 003ef8effeb43a53a0f77fbad2551b49752e714e Mon Sep 17 00:00:00 2001 From: Jerry Wu Date: Sun, 29 Oct 2023 17:37:32 +0800 Subject: [PATCH] change initial weights for ucb agent --- agent/ucb_agent.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/agent/ucb_agent.py b/agent/ucb_agent.py index 51f95ef..dfadf2e 100644 --- a/agent/ucb_agent.py +++ b/agent/ucb_agent.py @@ -6,7 +6,7 @@ class UCBAgent(AbstractEpisodicRecommenderAgent): def __init__(self, sess, observation_space, action_space, eval_mode, alpha=1.0, learning_rate=0.001, summary_writer=None): super(UCBAgent, self).__init__(action_space, summary_writer) self._num_candidates = int(action_space.nvec[0]) - self._W = tf.Variable(np.random.normal(size=(self._num_candidates, 3)), name='W') + self._W = tf.Variable(np.random.uniform(0, 10, size=(self._num_candidates, 3)), name='W') self._sess = sess self._return_idx = None self._prev_pred_pr = None