1443 - Updated test_reward.py to reflect the changes to reward.py, so that the correct config values (i.e. compromisedShouldBeGood) are used on the correct steps during the training run
This commit is contained in:
@@ -28,4 +28,4 @@ def test_rewards_are_being_penalised_at_each_step_function():
|
||||
Average Reward: 2 (26 / 13)
|
||||
"""
|
||||
print("average reward", env.average_reward)
|
||||
assert env.average_reward == 2.0
|
||||
assert env.average_reward == -8.0
|
||||
|
||||
Reference in New Issue
Block a user