Skip to content

Commit

Permalink
chore(rstaa2024): update experimental scripts
Browse files Browse the repository at this point in the history
This commit updates the experimental scripts.
  • Loading branch information
rickstaa committed Sep 4, 2024
1 parent 27b6fdf commit d285642
Show file tree
Hide file tree
Showing 25 changed files with 417 additions and 44 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,8 @@ env_name: "stable_gym:CartPoleCost-v1"
ac_kwargs:
hidden_sizes:
actor: [256, 256] # NOTE: Using [256, 256] for consistency with the article.
critic: [64, 64, 16]
# critic: [64, 64, 16]
critic: [256, 256, 16]
activation:
actor: "nn.ReLU"
critic: "nn.ReLU"
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,8 @@ env_name: "stable_gym:CartPoleCost-v1"
ac_kwargs:
hidden_sizes:
actor: [256, 256] # NOTE: Using [256, 256] for consistency with the article.
critic: [64, 64, 16]
# critic: [64, 64, 16]
critic: [256, 256, 16]
activation:
actor: "nn.ReLU"
critic: "nn.ReLU"
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,8 @@ env_name: "stable_gym:CartPoleCost-v1"
ac_kwargs:
hidden_sizes:
actor: [256, 256] # NOTE: Using [256, 256] for consistency with the article.
critic: [64, 64, 16]
# critic: [64, 64, 16]
critic: [256, 256, 16]
activation:
actor: "nn.ReLU"
critic: "nn.ReLU"
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,8 @@ env_name: "stable_gym:CartPoleCost-v1"
ac_kwargs:
hidden_sizes:
actor: [256, 256] # NOTE: Using [256, 256] for consistency with the article.
critic: [64, 64, 16]
# critic: [64, 64, 16]
critic: [256, 256, 16]
activation:
actor: "nn.ReLU"
critic: "nn.ReLU"
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,8 @@ env_name: "stable_gym:CartPoleCost-v1"
ac_kwargs:
hidden_sizes:
actor: [256, 256] # NOTE: Using [256, 256] for consistency with the article.
critic: [64, 64, 16]
# critic: [64, 64, 16]
critic: [256, 256, 16]
activation:
actor: "nn.ReLU"
critic: "nn.ReLU"
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,8 @@ env_name: "stable_gym:CartPoleCost-v1"
ac_kwargs:
hidden_sizes:
actor: [256, 256] # NOTE: Using [256, 256] for consistency with the article.
critic: [64, 64, 16]
# critic: [64, 64, 16]
critic: [256, 256, 16]
activation:
actor: "nn.ReLU"
critic: "nn.ReLU"
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,8 @@ env_name: "stable_gym:FetchReachCost-v1"
ac_kwargs:
hidden_sizes:
actor: [256, 256] # NOTE: Using [256, 256] for consistency with the article.
critic: [64, 64, 16]
# critic: [64, 64, 16]
critic: [256, 256, 16]
activation:
actor: "nn.ReLU"
critic: "nn.ReLU"
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,8 @@ env_name: "stable_gym:FetchReachCost-v1"
ac_kwargs:
hidden_sizes:
actor: [256, 256] # NOTE: Using [256, 256] for consistency with the article.
critic: [64, 64, 16]
# critic: [64, 64, 16]
critic: [256, 256, 16]
activation:
actor: "nn.ReLU"
critic: "nn.ReLU"
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,8 @@ env_name: "stable_gym:FetchReachCost-v1"
ac_kwargs:
hidden_sizes:
actor: [256, 256] # NOTE: Using [256, 256] for consistency with the article.
critic: [64, 64, 16]
# critic: [64, 64, 16]
critic: [256, 256, 16]
activation:
actor: "nn.ReLU"
critic: "nn.ReLU"
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,8 @@ env_name: "stable_gym:FetchReachCost-v1"
ac_kwargs:
hidden_sizes:
actor: [256, 256] # NOTE: Using [256, 256] for consistency with the article.
critic: [64, 64, 16]
# critic: [64, 64, 16]
critic: [256, 256, 16]
activation:
actor: "nn.ReLU"
critic: "nn.ReLU"
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,8 @@ env_name: "stable_gym:FetchReachCost-v1"
ac_kwargs:
hidden_sizes:
actor: [256, 256] # NOTE: Using [256, 256] for consistency with the article.
critic: [64, 64, 16]
# critic: [64, 64, 16]
critic: [256, 256, 16]
activation:
actor: "nn.ReLU"
critic: "nn.ReLU"
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,8 @@ env_name: "stable_gym:FetchReachCost-v1"
ac_kwargs:
hidden_sizes:
actor: [256, 256] # NOTE: Using [256, 256] for consistency with the article.
critic: [64, 64, 16]
# critic: [64, 64, 16]
critic: [256, 256, 16]
activation:
actor: "nn.ReLU"
critic: "nn.ReLU"
Expand Down
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed234_bigger_initial_alpha.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/different_steps_per_update/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed234_different_steps_per_update.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed234_bigger_initial_alpha.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/different_steps_per_update/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed234_different_steps_per_update.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/lac_critic/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed234_lac_critic.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/sac_extra_all/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed234_sac_extra_all.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/sac_extra_all/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed234_sac_extra_all.yml
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed3658_bigger_initial_alpha.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/different_steps_per_update/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed3658_different_steps_per_update.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed3658_bigger_initial_alpha.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/different_steps_per_update/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed3658_different_steps_per_update.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/lac_critic/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed3658_lac_critic.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/sac_extra_all/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed3658_sac_extra_all.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/sac_extra_all/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed3658_sac_extra_all.yml
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed48104_bigger_initial_alpha.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/different_steps_per_update/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed48104_different_steps_per_update.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed48104_bigger_initial_alpha.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/different_steps_per_update/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed48104_different_steps_per_update.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/lac_critic/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed48104_lac_critic.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/sac_extra_all/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed48104_sac_extra_all.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/sac_extra_all/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed48104_sac_extra_all.yml
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed567_bigger_initial_alpha.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/different_steps_per_update/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed567_different_steps_per_update.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed567_bigger_initial_alpha.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/different_steps_per_update/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed567_different_steps_per_update.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/lac_critic/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed567_lac_critic.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/sac_extra_all/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed567_sac_extra_all.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/sac_extra_all/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed567_sac_extra_all.yml
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed78456_bigger_initial_alpha.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/different_steps_per_update/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed78456_different_steps_per_update.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed78456_bigger_initial_alpha.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/different_steps_per_update/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed78456_different_steps_per_update.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/lac_critic/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed78456_lac_critic.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/sac_extra_all/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed78456_sac_extra_all.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/cartpole/sac_extra/sac_extra_all/han2020_reproduction_sac_cartpole_cost_alpha3_tune_experiment_seed78456_sac_extra_all.yml
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed234_bigger_initial_alpha.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/different_steps_per_update/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed234_different_steps_per_update.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed234_bigger_initial_alpha.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/different_steps_per_update/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed234_different_steps_per_update.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/lac_critic/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed234_lac_critic.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/sac_extra_all/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed234_sac_extra_all.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/sac_extra_all/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed234_sac_extra_all.yml
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed3658_bigger_initial_alpha.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/different_steps_per_update/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed3658_different_steps_per_update.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed3658_bigger_initial_alpha.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/different_steps_per_update/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed3658_different_steps_per_update.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/lac_critic/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed3658_lac_critic.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/sac_extra_all/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed3658_sac_extra_all.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/sac_extra_all/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed3658_sac_extra_all.yml
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed48104_bigger_initial_alpha.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/different_steps_per_update/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed48104_different_steps_per_update.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed48104_bigger_initial_alpha.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/different_steps_per_update/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed48104_different_steps_per_update.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/lac_critic/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed48104_lac_critic.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/sac_extra_all/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed48104_sac_extra_all.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/sac_extra_all/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed48104_sac_extra_all.yml
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed567_bigger_initial_alpha.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/different_steps_per_update/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed567_different_steps_per_update.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed567_bigger_initial_alpha.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/different_steps_per_update/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed567_different_steps_per_update.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/lac_critic/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed567_lac_critic.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/sac_extra_all/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed567_sac_extra_all.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/sac_extra_all/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed567_sac_extra_all.yml
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed78456_bigger_initial_alpha.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/different_steps_per_update/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed78456_different_steps_per_update.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/bigger_initial_alpha/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed78456_bigger_initial_alpha.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/different_steps_per_update/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed78456_different_steps_per_update.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/lac_critic/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed78456_lac_critic.yml
python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/sac_extra_all/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed78456_sac_extra_all.yml
# python -m stable_learning_control.run --exp_cfg experiments/staa_et_al_2024/fetch_reach/sac_extra/sac_extra_all/han2020_reproduction_sac_fetch_reach_alpha3_tune_experiment_seed78456_sac_extra_all.yml
Original file line number Diff line number Diff line change
@@ -1,7 +1,6 @@
"""This script is used to perform the data analysis of the alpha3 tuning experiments of
my master's thesis.
"""

# import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
Expand Down Expand Up @@ -195,7 +194,7 @@ def calculate_condition_convergence_statistics(
print("Creating {} plot...".format(env_name.replace("_", " ").title()))

# Retrieve data directories and add legend column.
- if not Path(DATA_DIR).exists():
+ if not Path(DATA_DIR).resolve().exists():
raise FileNotFoundError(f"The data directory {DATA_DIR} does not exist.")
all_data_folders = sorted(
[str(f) for f in Path(DATA_DIR).iterdir() if f.is_dir()]
Expand Down
Loading

0 comments on commit d285642

Please sign in to comment.