Skip to content

Commit

Permalink
Update config
Browse files: browse the repository at this point in the history
  • Loading branch information
Skylark0924 committed Aug 24, 2023
1 parent 147a41e commit e5c3428
Show file tree
Hide file tree
Showing 16 changed files with 48 additions and 0 deletions.
3 changes: 3 additions & 0 deletions rofunc/config/learning/rl/train/AntPPORofuncRL.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -16,7 +16,10 @@ Trainer:
start_learning_steps: 0 # The number of steps to take before starting network updating.
seed: 42 # The random seed.
rollouts: 16 # The number of rollouts before updating.
eval_flag: False # If true, run evaluation.
eval_freq: 2500 # The frequency of evaluation (in timesteps).
eval_steps: 1000 # The number of steps to run for evaluation.
use_eval_thread: True # If true, use a separate thread for evaluation.
inference_steps: 1000 # The number of steps to run for inference.
max_episode_steps: 200 # The maximum number of steps per episode.

Expand Down
3 changes: 3 additions & 0 deletions rofunc/config/learning/rl/train/BaseTaskA2CRofuncRL.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,10 @@ Trainer:
start_learning_steps: 0 # The number of steps to take before starting network updating.
seed: 42 # The random seed.
rollouts: 16 # The number of rollouts before updating.
eval_flag: False # If true, run evaluation.
eval_freq: 2500 # The frequency of evaluation (in timesteps).
eval_steps: 1000 # The number of steps to run for evaluation.
use_eval_thread: True # If true, use a separate thread for evaluation.
inference_steps: 1000 # The number of steps to run for inference.
max_episode_steps: 200 # The maximum number of steps per episode.

Expand Down
3 changes: 3 additions & 0 deletions rofunc/config/learning/rl/train/BaseTaskAMPRofuncRL.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,10 @@ Trainer:
start_learning_steps: 0 # The number of steps to take before starting network updating.
seed: 42 # The random seed.
rollouts: 16 # The number of rollouts before updating.
eval_flag: False # If true, run evaluation.
eval_freq: 2500 # The frequency of evaluation (in timesteps).
eval_steps: 1000 # The number of steps to run for evaluation.
use_eval_thread: True # If true, use a separate thread for evaluation.
inference_steps: 1000 # The number of steps to run for inference.
max_episode_steps: 200 # The maximum number of steps per episode.

Expand Down
3 changes: 3 additions & 0 deletions rofunc/config/learning/rl/train/BaseTaskPPORofuncRL.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,10 @@ Trainer:
start_learning_steps: 0 # The number of steps to take before starting network updating.
seed: 42 # The random seed.
rollouts: 16 # The number of rollouts before updating.
eval_flag: True # If true, run evaluation.
eval_freq: 2500 # The frequency of evaluation (in timesteps).
eval_steps: 1000 # The number of steps to run for evaluation.
use_eval_thread: True # If true, use a separate thread for evaluation.
inference_steps: 1000 # The number of steps to run for inference.
max_episode_steps: 200 # The maximum number of steps per episode.

Expand Down
3 changes: 3 additions & 0 deletions rofunc/config/learning/rl/train/BaseTaskSACRofuncRL.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,10 @@ Trainer:
start_learning_steps: 1000 # The number of steps to take before starting network updating.
seed: 42 # The random seed.
rollouts: 16 # The number of rollouts before updating.
eval_flag: False # If true, run evaluation.
eval_freq: 2500 # The frequency of evaluation (in timesteps).
eval_steps: 1000 # The number of steps to run for evaluation.
use_eval_thread: True # If true, use a separate thread for evaluation.
inference_steps: 1000 # The number of steps to run for inference.
max_episode_steps: 200 # The maximum number of steps per episode.

Expand Down
3 changes: 3 additions & 0 deletions rofunc/config/learning/rl/train/BaseTaskTD3RofuncRL.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,10 @@ Trainer:
start_learning_steps: 0 # The number of steps to take before starting network updating.
seed: 42 # The random seed.
rollouts: 16 # The number of rollouts before updating.
eval_flag: False # If true, run evaluation.
eval_freq: 2500 # The frequency of evaluation (in timesteps).
eval_steps: 1000 # The number of steps to run for evaluation.
use_eval_thread: True # If true, use a separate thread for evaluation.
inference_steps: 1000 # The number of steps to run for inference.
max_episode_steps: 200 # The maximum number of steps per episode.

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -16,7 +16,10 @@ Trainer:
start_learning_steps: 0 # The number of steps to take before starting network updating.
seed: 42 # The random seed.
rollouts: 16 # The number of rollouts before updating.
eval_flag: False # If true, run evaluation.
eval_freq: 2500 # The frequency of evaluation (in timesteps).
eval_steps: 1000 # The number of steps to run for evaluation.
use_eval_thread: True # If true, use a separate thread for evaluation.
inference_steps: 1000 # The number of steps to run for inference.
max_episode_steps: 200 # The maximum number of steps per episode.

Expand Down
3 changes: 3 additions & 0 deletions rofunc/config/learning/rl/train/CURICabinetPPORofuncRL.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -16,7 +16,10 @@ Trainer:
start_learning_steps: 0 # The number of steps to take before starting network updating.
seed: 42 # The random seed.
rollouts: 16 # The number of rollouts before updating.
eval_flag: False # If true, run evaluation.
eval_freq: 2500 # The frequency of evaluation (in timesteps).
eval_steps: 1000 # The number of steps to run for evaluation.
use_eval_thread: True # If true, use a separate thread for evaluation.
inference_steps: 1000 # The number of steps to run for inference.
max_episode_steps: 200 # The maximum number of steps per episode.

Expand Down
3 changes: 3 additions & 0 deletions rofunc/config/learning/rl/train/CURICabinetSACRofuncRL.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -15,7 +15,10 @@ Trainer:
start_learning_steps: 0 # The number of steps to take before starting network updating.
seed: 42 # The random seed.
rollouts: 16 # The number of rollouts before updating.
eval_flag: False # If true, run evaluation.
eval_freq: 2500 # The frequency of evaluation (in timesteps).
eval_steps: 1000 # The number of steps to run for evaluation.
use_eval_thread: True # If true, use a separate thread for evaluation.
inference_steps: 1000 # The number of steps to run for inference.
max_episode_steps: 200 # The maximum number of steps per episode.

Expand Down
3 changes: 3 additions & 0 deletions rofunc/config/learning/rl/train/FrankaCabinetPPORofuncRL.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -16,7 +16,10 @@ Trainer:
start_learning_steps: 0 # The number of steps to take before starting network updating.
seed: 42 # The random seed.
rollouts: 16 # The number of rollouts before updating.
eval_flag: False # If true, run evaluation.
eval_freq: 2500 # The frequency of evaluation (in timesteps).
eval_steps: 1000 # The number of steps to run for evaluation.
use_eval_thread: True # If true, use a separate thread for evaluation.
inference_steps: 1000 # The number of steps to run for inference.
max_episode_steps: 200 # The maximum number of steps per episode.

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,10 @@ Trainer:
start_learning_steps: 0 # The number of steps to take before starting network updating.
seed: 42 # The random seed.
rollouts: 32 # The number of rollouts before updating.
eval_flag: False # If true, run evaluation.
eval_freq: 2500 # The frequency of evaluation (in timesteps).
eval_steps: 1000 # The number of steps to run for evaluation.
use_eval_thread: True # If true, use a separate thread for evaluation.
inference_steps: 1000 # The number of steps to run for inference.
max_episode_steps: 200 # The maximum number of steps per episode.

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,10 @@ Trainer:
start_learning_steps: 0 # The number of steps to take before starting network updating.
seed: 42 # The random seed.
rollouts: 32 # The number of rollouts before updating.
eval_flag: False # If true, run evaluation.
eval_freq: 2500 # The frequency of evaluation (in timesteps).
eval_steps: 1000 # The number of steps to run for evaluation.
use_eval_thread: True # If true, use a separate thread for evaluation.
inference_steps: 1000 # The number of steps to run for inference.
max_episode_steps: 200 # The maximum number of steps per episode.

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,10 @@ Trainer:
start_learning_steps: 0 # The number of steps to take before starting network updating.
seed: 42 # The random seed.
rollouts: 32 # The number of rollouts before updating.
eval_flag: False # If true, run evaluation.
eval_freq: 2500 # The frequency of evaluation (in timesteps).
eval_steps: 1000 # The number of steps to run for evaluation.
use_eval_thread: True # If true, use a separate thread for evaluation.
inference_steps: 1000 # The number of steps to run for inference.
max_episode_steps: 200 # The maximum number of steps per episode.

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,10 @@ Trainer:
start_learning_steps: 0 # The number of steps to take before starting network updating.
seed: 42 # The random seed.
rollouts: 32 # The number of rollouts before updating.
eval_flag: False # If true, run evaluation.
eval_freq: 2500 # The frequency of evaluation (in timesteps).
eval_steps: 1000 # The number of steps to run for evaluation.
use_eval_thread: True # If true, use a separate thread for evaluation.
inference_steps: 1000 # The number of steps to run for inference.
max_episode_steps: 200 # The maximum number of steps per episode.

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,10 @@ Trainer:
start_learning_steps: 0 # The number of steps to take before starting network updating.
seed: 42 # The random seed.
rollouts: 32 # The number of rollouts before updating.
eval_flag: False # If true, run evaluation.
eval_freq: 2500 # The frequency of evaluation (in timesteps).
eval_steps: 1000 # The number of steps to run for evaluation.
use_eval_thread: True # If true, use a separate thread for evaluation.
inference_steps: 1000 # The number of steps to run for inference.
max_episode_steps: 200 # The maximum number of steps per episode.

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,10 @@ Trainer:
start_learning_steps: 0 # The number of steps to take before starting network updating.
seed: 42 # The random seed.
rollouts: 32 # The number of rollouts before updating.
eval_flag: False # If true, run evaluation.
eval_freq: 2500 # The frequency of evaluation (in timesteps).
eval_steps: 1000 # The number of steps to run for evaluation.
use_eval_thread: True # If true, use a separate thread for evaluation.
inference_steps: 1000 # The number of steps to run for inference.
max_episode_steps: 200 # The maximum number of steps per episode.

Expand Down

0 comments on commit e5c3428

Please sign in to comment.