Skip to content

Commit

Permalink
naming convention
Browse files Browse the repository at this point in the history
  • Loading branch information
qiaoting159753 committed Jan 9, 2025
1 parent ca34d5f commit 799b8e3
Show file tree
Hide file tree
Showing 51 changed files with 739 additions and 0 deletions.
33 changes: 33 additions & 0 deletions env_acrobot_swingup/Dyna/DynaSAC_Bounded_Yao/alg_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
{
"algorithm": "DynaSAC_Bounded_Yao",
"type": "mbrl",
"G": 1,
"G_model": 5.0,
"batch_size": 256,
"buffer_size": 1000000,
"max_steps_exploration": 256,
"max_steps_training": 1000000,
"number_steps_per_train_policy": 1,

"reward_scale": 1.0,
"actor_lr": 3e-4,
"critic_lr": 3e-4,
"alpha_lr": 3e-4,
"gamma": 0.99,
"tau": 0.005,

"min_noise": 0.0,
"noise_scale": 0.1,
"noise_decay": 1.0,

"num_models": 6,
"world_model_lr": 0.001,
"horizon": 1,
"num_samples": 10,
"sas": false,
"train_reward": true,
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
}
5 changes: 5 additions & 0 deletions env_acrobot_swingup/Dyna/DynaSAC_Bounded_Yao/env_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
"gym": "dmcs",
"task": "swingup",
"domain": "acrobot"
}
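5 changes: 5 additions & 0 deletions env_acrobot_swingup/Dyna/DynaSAC_Bounded_Yao/train_config.json
Original file line number Diff line number Diff line change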
@@ -0,0 +1,5 @@
{
"seeds": [15, 25, 35, 45, 55],
"number_steps_per_evaluation": 10000,
"number_eval_episodes": 10
}
34 changes: 34 additions & 0 deletions env_acrobot_swingup/STEVE/STEVESAC_3_Yao/alg_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,34 @@
{
"algorithm": "STEVESAC_Bounded_Yao",
"type": "mbrl",
"G": 1,
"G_model": 5.0,
"batch_size": 256,
"buffer_size": 1000000,
"max_steps_exploration": 256,
"max_steps_training": 1000000,
"number_steps_per_train_policy": 1,

"reward_scale": 1.0,
"actor_lr": 3e-4,
"critic_lr": 3e-4,
"alpha_lr": 3e-4,
"gamma": 0.99,
"tau": 0.005,

"min_noise": 0.0,
"noise_scale": 0.1,
"noise_decay": 1.0,

"num_models": 6,
"num_rwd_models": 5,

"world_model_lr": 0.001,
"horizon": 3,
"sas": false,
"train_reward": true,
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
}
5 changes: 5 additions & 0 deletions env_acrobot_swingup/STEVE/STEVESAC_3_Yao/env_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
"gym": "dmcs",
"task": "swingup",
"domain": "acrobot"
}
5 changes: 5 additions & 0 deletions env_acrobot_swingup/STEVE/STEVESAC_3_Yao/train_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
"seeds": [15,25,35,45,55],
"number_steps_per_evaluation": 10000,
"number_eval_episodes": 10
}
33 changes: 33 additions & 0 deletions env_cheetah_run/Dyna/DynaSAC_Bounded_Yao/alg_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
{
"algorithm": "DynaSAC_Bounded_Yao",
"type": "mbrl",
"G": 1,
"G_model": 5.0,
"batch_size": 256,
"buffer_size": 1000000,
"max_steps_exploration": 256,
"max_steps_training": 1000000,
"number_steps_per_train_policy": 1,

"reward_scale": 1.0,
"actor_lr": 3e-4,
"critic_lr": 3e-4,
"alpha_lr": 3e-4,
"gamma": 0.99,
"tau": 0.005,

"min_noise": 0.0,
"noise_scale": 0.1,
"noise_decay": 1.0,

"num_models": 6,
"world_model_lr": 0.001,
"horizon": 1,
"num_samples": 10,
"sas": false,
"train_reward": true,
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
}
5 changes: 5 additions & 0 deletions env_cheetah_run/Dyna/DynaSAC_Bounded_Yao/env_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
"gym": "dmcs",
"task": "run",
"domain": "cheetah"
}
5 changes: 5 additions & 0 deletions env_cheetah_run/Dyna/DynaSAC_Bounded_Yao/train_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
"seeds": [15, 25, 35, 45, 55],
"number_steps_per_evaluation": 10000,
"number_eval_episodes": 10
}
34 changes: 34 additions & 0 deletions env_cheetah_run/STEVE/STEVESAC_3_Yao/alg_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,34 @@
{
"algorithm": "STEVESAC_Bounded_Yao",
"type": "mbrl",
"G": 1,
"G_model": 5.0,
"batch_size": 256,
"buffer_size": 1000000,
"max_steps_exploration": 256,
"max_steps_training": 1000000,
"number_steps_per_train_policy": 1,

"reward_scale": 1.0,
"actor_lr": 3e-4,
"critic_lr": 3e-4,
"alpha_lr": 3e-4,
"gamma": 0.99,
"tau": 0.005,

"min_noise": 0.0,
"noise_scale": 0.1,
"noise_decay": 1.0,

"num_models": 6,
"num_rwd_models": 5,

"world_model_lr": 0.001,
"horizon": 3,
"sas": false,
"train_reward": true,
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
}
5 changes: 5 additions & 0 deletions env_cheetah_run/STEVE/STEVESAC_3_Yao/env_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
"gym": "dmcs",
"task": "run",
"domain": "cheetah"
}
5 changes: 5 additions & 0 deletions env_cheetah_run/STEVE/STEVESAC_3_Yao/train_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
"seeds": [15,25,35,45,55],
"number_steps_per_evaluation": 10000,
"number_eval_episodes": 10
}
33 changes: 33 additions & 0 deletions env_finger_turn_hard/Dyna/DynaSAC_Bounded_Yao/alg_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
{
"algorithm": "DynaSAC_Bounded_Yao",
"type": "mbrl",
"G": 1,
"G_model": 5.0,
"batch_size": 256,
"buffer_size": 1000000,
"max_steps_exploration": 256,
"max_steps_training": 1000000,
"number_steps_per_train_policy": 1,

"reward_scale": 1.0,
"actor_lr": 3e-4,
"critic_lr": 3e-4,
"alpha_lr": 3e-4,
"gamma": 0.99,
"tau": 0.005,

"min_noise": 0.0,
"noise_scale": 0.1,
"noise_decay": 1.0,

"num_models": 6,
"world_model_lr": 0.001,
"horizon": 1,
"num_samples": 10,
"sas": false,
"train_reward": true,
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
}
5 changes: 5 additions & 0 deletions env_finger_turn_hard/Dyna/DynaSAC_Bounded_Yao/env_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
"gym": "dmcs",
"task": "turn_hard",
"domain": "finger"
}
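5 changes: 5 additions & 0 deletions env_finger_turn_hard/Dyna/DynaSAC_Bounded_Yao/train_config.json
Original file line number Diff line number Diff line change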
@@ -0,0 +1,5 @@
{
"seeds": [15, 25, 35, 45, 55],
"number_steps_per_evaluation": 10000,
"number_eval_episodes": 10
}
34 changes: 34 additions & 0 deletions env_finger_turn_hard/STEVE/STEVESAC_3_Yao/alg_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,34 @@
{
"algorithm": "STEVESAC_Bounded_Yao",
"type": "mbrl",
"G": 1,
"G_model": 5.0,
"batch_size": 256,
"buffer_size": 1000000,
"max_steps_exploration": 256,
"max_steps_training": 1000000,
"number_steps_per_train_policy": 1,

"reward_scale": 1.0,
"actor_lr": 3e-4,
"critic_lr": 3e-4,
"alpha_lr": 3e-4,
"gamma": 0.99,
"tau": 0.005,

"min_noise": 0.0,
"noise_scale": 0.1,
"noise_decay": 1.0,

"num_models": 6,
"num_rwd_models": 5,

"world_model_lr": 0.001,
"horizon": 3,
"sas": false,
"train_reward": true,
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
}
5 changes: 5 additions & 0 deletions env_finger_turn_hard/STEVE/STEVESAC_3_Yao/env_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
"gym": "dmcs",
"task": "turn_hard",
"domain": "finger"
}
5 changes: 5 additions & 0 deletions env_finger_turn_hard/STEVE/STEVESAC_3_Yao/train_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
"seeds": [15,25,35,45,55],
"number_steps_per_evaluation": 10000,
"number_eval_episodes": 10
}
33 changes: 33 additions & 0 deletions env_fish_swim/Dyna/DynaSAC_Bounded_Yao/alg_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
{
"algorithm": "DynaSAC_Bounded_Yao",
"type": "mbrl",
"G": 1,
"G_model": 5.0,
"batch_size": 256,
"buffer_size": 1000000,
"max_steps_exploration": 256,
"max_steps_training": 1000000,
"number_steps_per_train_policy": 1,

"reward_scale": 1.0,
"actor_lr": 3e-4,
"critic_lr": 3e-4,
"alpha_lr": 3e-4,
"gamma": 0.99,
"tau": 0.005,

"min_noise": 0.0,
"noise_scale": 0.1,
"noise_decay": 1.0,

"num_models": 6,
"world_model_lr": 0.001,
"horizon": 1,
"num_samples": 10,
"sas": false,
"train_reward": true,
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
}
5 changes: 5 additions & 0 deletions env_fish_swim/Dyna/DynaSAC_Bounded_Yao/env_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
"gym": "dmcs",
"task": "swim",
"domain": "fish"
}
5 changes: 5 additions & 0 deletions env_fish_swim/Dyna/DynaSAC_Bounded_Yao/train_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
"seeds": [15, 25, 35, 45, 55],
"number_steps_per_evaluation": 10000,
"number_eval_episodes": 10
}
34 changes: 34 additions & 0 deletions env_fish_swim/STEVE/STEVESAC_3_Yao/alg_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,34 @@
{
"algorithm": "STEVESAC_Bounded_Yao",
"type": "mbrl",
"G": 1,
"G_model": 5.0,
"batch_size": 256,
"buffer_size": 1000000,
"max_steps_exploration": 256,
"max_steps_training": 1000000,
"number_steps_per_train_policy": 1,

"reward_scale": 1.0,
"actor_lr": 3e-4,
"critic_lr": 3e-4,
"alpha_lr": 3e-4,
"gamma": 0.99,
"tau": 0.005,

"min_noise": 0.0,
"noise_scale": 0.1,
"noise_decay": 1.0,

"num_models": 6,
"num_rwd_models": 5,

"world_model_lr": 0.001,
"horizon": 3,
"sas": false,
"train_reward": true,
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
}
5 changes: 5 additions & 0 deletions env_fish_swim/STEVE/STEVESAC_3_Yao/env_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
"gym": "dmcs",
"task": "swim",
"domain": "fish"
}
5 changes: 5 additions & 0 deletions env_fish_swim/STEVE/STEVESAC_3_Yao/train_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
"seeds": [15,25,35,45,55],
"number_steps_per_evaluation": 10000,
"number_eval_episodes": 10
}
Loading

0 comments on commit 799b8e3

Please sign in to comment.