From 1599d67f8922c02c40ad71e72d0ac17b3bdeb4fc Mon Sep 17 00:00:00 2001 From: Daniel Liu Date: Thu, 10 Sep 2020 16:12:04 +0800 Subject: [PATCH] fix a minor bug for setting prob_leave_bandit of transition matrix --- recogym/envs/reco_env_v0.py | 2 +- recogym/envs/reco_env_v1.py | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/recogym/envs/reco_env_v0.py b/recogym/envs/reco_env_v0.py index a03d60e..b084854 100644 --- a/recogym/envs/reco_env_v0.py +++ b/recogym/envs/reco_env_v0.py @@ -23,7 +23,7 @@ def set_static_params(self): # State transition Matrix between Organic, Bandit, Leave self.state_transition = array([ [0, self.config.prob_organic_to_bandit, self.config.prob_leave_organic], - [self.config.prob_bandit_to_organic, 0, self.config.prob_leave_organic], + [self.config.prob_bandit_to_organic, 0, self.config.prob_leave_bandit], [0.0, 0.0, 1.] ]) diff --git a/recogym/envs/reco_env_v1.py b/recogym/envs/reco_env_v1.py index b0b616c..7cab2ba 100644 --- a/recogym/envs/reco_env_v1.py +++ b/recogym/envs/reco_env_v1.py @@ -53,7 +53,7 @@ def set_static_params(self): # high level transitions between organic, bandit and leave. self.state_transition = np.array([ [0, self.config.prob_organic_to_bandit, self.config.prob_leave_organic], - [self.config.prob_bandit_to_organic, 0, self.config.prob_leave_organic], + [self.config.prob_bandit_to_organic, 0, self.config.prob_leave_bandit], [0.0, 0.0, 1.] ])