Skip to content

Commit

Permalink
Turn down gain on GAIL discriminator output (#4762) (#4772)
Browse files Browse the repository at this point in the history
  • Loading branch information
andrewcoh authored Dec 18, 2020
1 parent a2b81c3 commit 30ed097
Show file tree
Hide file tree
Showing 2 changed files with 2 additions and 2 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -80,7 +80,7 @@ def test_reward_decreases(
init_reward_expert = gail_rp.evaluate(buffer_expert)[0]
init_reward_policy = gail_rp.evaluate(buffer_policy)[0]

- for _ in range(10):
+ for _ in range(20):
gail_rp.update(buffer_policy)
reward_expert = gail_rp.evaluate(buffer_expert)[0]
reward_policy = gail_rp.evaluate(buffer_policy)[0]
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -103,7 +103,7 @@ def __init__(self, specs: BehaviorSpec, settings: GAILSettings) -> None:
)

self._estimator = torch.nn.Sequential(
- linear_layer(estimator_input_size, 1), torch.nn.Sigmoid()
+ linear_layer(estimator_input_size, 1, kernel_gain=0.2), torch.nn.Sigmoid()
)

def get_action_input(self, mini_batch: AgentBuffer) -> torch.Tensor:
Expand Down

0 comments on commit 30ed097

Please sign in to comment.