diff --git a/rl/spec/box2d_experiment_specs.json b/rl/spec/box2d_experiment_specs.json index c379ec4..7391fbe 100644 --- a/rl/spec/box2d_experiment_specs.json +++ b/rl/spec/box2d_experiment_specs.json @@ -106,7 +106,7 @@ "Policy": "DoubleDQNBoltzmannPolicy", "PreProcessor": "StackStates", "param": { - "train_per_n_new_exp": 5, + "train_per_n_new_exp": 2, "lr": 0.005, "gamma": 0.99, "hidden_layers": [800, 400], @@ -114,7 +114,7 @@ "output_layer_activation": "linear", "exploration_anneal_episodes": 150, "epi_change_lr": 200, - "max_mem_len": 20000 + "max_mem_len": 30000 }, "param_range": { "lr": [0.001, 0.005, 0.01], diff --git a/rl/spec/classic_experiment_specs.json b/rl/spec/classic_experiment_specs.json index 7025538..3917173 100644 --- a/rl/spec/classic_experiment_specs.json +++ b/rl/spec/classic_experiment_specs.json @@ -460,7 +460,7 @@ "Policy": "DoubleDQNBoltzmannPolicy", "PreProcessor": "StackStates", "param": { - "train_per_n_new_exp": 4, + "train_per_n_new_exp": 1, "lr": 0.01, "gamma": 0.99, "hidden_layers": [32],