@@ -38,7 +38,7 @@ def __init__(self, use_discrete):
38
38
super ().__init__ ()
39
39
self .discrete = use_discrete
40
40
self ._brains : Dict [str , BrainParameters ] = {}
41
- self . _brains [ BRAIN_NAME ] = BrainParameters (
41
+ brain_params = BrainParameters (
42
42
brain_name = BRAIN_NAME ,
43
43
vector_observation_space_size = OBS_SIZE ,
44
44
num_stacked_vector_observations = 1 ,
@@ -47,11 +47,12 @@ def __init__(self, use_discrete):
47
47
vector_action_descriptions = ["moveDirection" ],
48
48
vector_action_space_type = 0 if use_discrete else 1 ,
49
49
)
50
+ self ._brains [BRAIN_NAME ] = brain_params
50
51
51
52
# state
52
53
self .position = 0.0
53
54
self .step_count = 0
54
- self .random = random .Random (str (self . _brains ))
55
+ self .random = random .Random (str (brain_params ))
55
56
self .goal = self .random .choice ([- 1 , 1 ])
56
57
57
58
def step (
@@ -228,7 +229,7 @@ def _check_environment_trains(env, config):
228
229
print (tc ._get_measure_vals ())
229
230
for brain_name , mean_reward in tc ._get_measure_vals ().items ():
230
231
assert not math .isnan (mean_reward )
231
- assert mean_reward > 0.9
232
+ assert mean_reward > 0.99
232
233
233
234
234
235
@pytest .mark .parametrize ("use_discrete" , [True , False ])
0 commit comments