From 1d707e7c88af29e0d8c2797fe89e7375a3574a41 Mon Sep 17 00:00:00 2001 From: kengz Date: Tue, 4 Apr 2017 08:05:26 -0400 Subject: [PATCH] reschedule lunar and acrobot per --- rl/spec/box2d_experiment_specs.json | 4 ++-- rl/spec/classic_experiment_specs.json | 2 +- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/rl/spec/box2d_experiment_specs.json b/rl/spec/box2d_experiment_specs.json index c379ec4..7391fbe 100644 --- a/rl/spec/box2d_experiment_specs.json +++ b/rl/spec/box2d_experiment_specs.json @@ -106,7 +106,7 @@ "Policy": "DoubleDQNBoltzmannPolicy", "PreProcessor": "StackStates", "param": { - "train_per_n_new_exp": 5, + "train_per_n_new_exp": 2, "lr": 0.005, "gamma": 0.99, "hidden_layers": [800, 400], @@ -114,7 +114,7 @@ "output_layer_activation": "linear", "exploration_anneal_episodes": 150, "epi_change_lr": 200, - "max_mem_len": 20000 + "max_mem_len": 30000 }, "param_range": { "lr": [0.001, 0.005, 0.01], diff --git a/rl/spec/classic_experiment_specs.json b/rl/spec/classic_experiment_specs.json index 7025538..3917173 100644 --- a/rl/spec/classic_experiment_specs.json +++ b/rl/spec/classic_experiment_specs.json @@ -460,7 +460,7 @@ "Policy": "DoubleDQNBoltzmannPolicy", "PreProcessor": "StackStates", "param": { - "train_per_n_new_exp": 4, + "train_per_n_new_exp": 1, "lr": 0.01, "gamma": 0.99, "hidden_layers": [32],