Skip to content

Commit 0ff8f77

Browse files
authored
Turn down gain on GAIL discriminator output (#4762)
1 parent fbd4bd7 commit 0ff8f77

File tree

2 files changed

+2
-2
lines changed

2 files changed

+2
-2
lines changed

ml-agents/mlagents/trainers/tests/torch/test_reward_providers/test_gail.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -80,7 +80,7 @@ def test_reward_decreases(
8080
init_reward_expert = gail_rp.evaluate(buffer_expert)[0]
8181
init_reward_policy = gail_rp.evaluate(buffer_policy)[0]
8282

83-
for _ in range(10):
83+
for _ in range(20):
8484
gail_rp.update(buffer_policy)
8585
reward_expert = gail_rp.evaluate(buffer_expert)[0]
8686
reward_policy = gail_rp.evaluate(buffer_policy)[0]

ml-agents/mlagents/trainers/torch/components/reward_providers/gail_reward_provider.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -103,7 +103,7 @@ def __init__(self, specs: BehaviorSpec, settings: GAILSettings) -> None:
103103
)
104104

105105
self._estimator = torch.nn.Sequential(
106-
linear_layer(estimator_input_size, 1), torch.nn.Sigmoid()
106+
linear_layer(estimator_input_size, 1, kernel_gain=0.2), torch.nn.Sigmoid()
107107
)
108108

109109
def get_action_input(self, mini_batch: AgentBuffer) -> torch.Tensor:

0 commit comments

Comments
 (0)