Skip to content

Commit

Permalink
naming convention
Browse files Browse the repository at this point in the history
  • Loading branch information
qiaoting159753 committed Jan 9, 2025
1 parent 799b8e3 commit deb506f
Show file tree
Hide file tree
Showing 22 changed files with 103 additions and 16 deletions.
2 changes: 1 addition & 1 deletion env_acrobot_swingup/Dyna/DynaSAC_Bounded_Yao/alg_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -29,5 +29,5 @@
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
"exploration_sample": 5
}
2 changes: 1 addition & 1 deletion env_acrobot_swingup/STEVE/STEVESAC_3_Yao/alg_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -30,5 +30,5 @@
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
"exploration_sample": 5
}
33 changes: 33 additions & 0 deletions env_cartpole_swingup/Dyna/DynaSAC_Bounded_Yao/alg_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
{
"algorithm": "DynaSAC_Bounded_Yao",
"type": "mbrl",
"G": 1,
"G_model": 5.0,
"batch_size": 256,
"buffer_size": 400000,
"max_steps_exploration": 256,
"max_steps_training": 400000,
"number_steps_per_train_policy": 1,

"reward_scale": 1.0,
"actor_lr": 3e-4,
"critic_lr": 3e-4,
"alpha_lr": 3e-4,
"gamma": 0.99,
"tau": 0.005,

"min_noise": 0.0,
"noise_scale": 0.1,
"noise_decay": 1.0,

"num_models": 6,
"world_model_lr": 0.001,
"horizon": 1,
"num_samples": 10,
"sas": false,
"train_reward": true,
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 5
}
5 changes: 5 additions & 0 deletions env_cartpole_swingup/Dyna/DynaSAC_Bounded_Yao/env_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
"gym": "dmcs",
"task": "swingup",
"domain": "cartpole"
}
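5 changes: 5 additions & 0 deletions env_cartpole_swingup/Dyna/DynaSAC_Bounded_Yao/train_config.json
Original file line number Diff line number Diff line change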
@@ -0,0 +1,5 @@
{
"seeds": [15, 25, 35, 45, 55],
"number_steps_per_evaluation": 10000,
"number_eval_episodes": 10
}
34 changes: 34 additions & 0 deletions env_cartpole_swingup/STEVE/STEVESAC_3_Yao/alg_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,34 @@
{
"algorithm": "STEVESAC_Bounded_Yao",
"type": "mbrl",
"G": 1,
"G_model": 5.0,
"batch_size": 256,
"buffer_size": 400000,
"max_steps_exploration": 256,
"max_steps_training": 400000,
"number_steps_per_train_policy": 1,

"reward_scale": 1.0,
"actor_lr": 3e-4,
"critic_lr": 3e-4,
"alpha_lr": 3e-4,
"gamma": 0.99,
"tau": 0.005,

"min_noise": 0.0,
"noise_scale": 0.1,
"noise_decay": 1.0,

"num_models": 6,
"num_rwd_models": 5,

"world_model_lr": 0.001,
"horizon": 3,
"sas": false,
"train_reward": true,
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 5
}
5 changes: 5 additions & 0 deletions env_cartpole_swingup/STEVE/STEVESAC_3_Yao/env_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
"gym": "dmcs",
"task": "swingup",
"domain": "cartpole"
}
5 changes: 5 additions & 0 deletions env_cartpole_swingup/STEVE/STEVESAC_3_Yao/train_config.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
"seeds": [15,25,35,45,55],
"number_steps_per_evaluation": 10000,
"number_eval_episodes": 10
}
2 changes: 1 addition & 1 deletion env_cheetah_run/Dyna/DynaSAC_Bounded_Yao/alg_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -29,5 +29,5 @@
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
"exploration_sample": 5
}
2 changes: 1 addition & 1 deletion env_cheetah_run/STEVE/STEVESAC_3_Yao/alg_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -30,5 +30,5 @@
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
"exploration_sample": 5
}
2 changes: 1 addition & 1 deletion env_finger_turn_hard/Dyna/DynaSAC_Bounded_Yao/alg_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -29,5 +29,5 @@
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
"exploration_sample": 5
}
2 changes: 1 addition & 1 deletion env_finger_turn_hard/STEVE/STEVESAC_3_Yao/alg_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -30,5 +30,5 @@
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
"exploration_sample": 5
}
2 changes: 1 addition & 1 deletion env_fish_swim/Dyna/DynaSAC_Bounded_Yao/alg_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -29,5 +29,5 @@
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
"exploration_sample": 5
}
2 changes: 1 addition & 1 deletion env_fish_swim/STEVE/STEVESAC_3_Yao/alg_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -30,5 +30,5 @@
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
"exploration_sample": 5
}
2 changes: 1 addition & 1 deletion env_hopper_hop/Dyna/DynaSAC_Bounded_Yao/alg_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -29,5 +29,5 @@
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
"exploration_sample": 5
}
2 changes: 1 addition & 1 deletion env_hopper_hop/STEVE/STEVESAC_3_Yao/alg_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -30,5 +30,5 @@
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
"exploration_sample": 5
}
2 changes: 1 addition & 1 deletion env_humanoid_run/Dyna/DynaSAC_Bounded_Yao/alg_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -29,5 +29,5 @@
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
"exploration_sample": 5
}
2 changes: 1 addition & 1 deletion env_humanoid_run/STEVE/STEVESAC_3_Yao/alg_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -30,5 +30,5 @@
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
"exploration_sample": 5
}
2 changes: 1 addition & 1 deletion env_reacher_hard/Dyna/DynaSAC_Bounded_Yao/alg_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -29,5 +29,5 @@
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
"exploration_sample": 5
}
2 changes: 1 addition & 1 deletion env_reacher_hard/STEVE/STEVESAC_3_Yao/alg_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -30,5 +30,5 @@
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
"exploration_sample": 5
}
2 changes: 1 addition & 1 deletion env_walker_walk/Dyna/DynaSAC_Bounded_Yao/alg_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -29,5 +29,5 @@
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
"exploration_sample": 5
}
2 changes: 1 addition & 1 deletion env_walker_walk/STEVE/STEVESAC_3_Yao/alg_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -30,5 +30,5 @@
"train_both": false,
"gripper": false,
"threshold": 1.0,
"exploration_sample": 2
"exploration_sample": 5
}

0 comments on commit deb506f

Please sign in to comment.