Skip to content

Commit 9eaf9ce

Browse files
Erik Jenner
Erik Jenner
authored and
Erik Jenner
committed
Update dates after copying
1 parent e58646b commit 9eaf9ce

Some content is hidden

Large commits have some content hidden by default. Use the search box below for content that may be hidden.

44 files changed

+8
-5
lines changed

.circleci/config.yml

100644 → 100755
File mode changed.

.dockerignore

100644 → 100755
File mode changed.

.gitignore

100644 → 100755
File mode changed.

Dockerfile

100644 → 100755
File mode changed.

README.md

100644 → 100755
File mode changed.

pyproject.toml

100644 → 100755
File mode changed.

scripts/create_rollouts.sh

+2 -1
Original file line number | Diff line number | Diff line change
@@ -5,7 +5,8 @@ set -euxo pipefail
55

66
env_name="$1"
77
AGENT="results/expert_demos/$env_name/policies/final/model.zip"
8-
ROLLOUTS="[(0, \"$AGENT\", \"expert\")]"
8+
# ROLLOUTS="[(0, \"$AGENT\", \"expert\")]"
9+
ROLLOUTS="[(1, None, \"random\")]"
910

1011
exec xvfb-run poetry run python src/reward_preprocessing/create_rollouts.py with \
1112
"rollouts=$ROLLOUTS" \

scripts/plot_mountain_car.sh

+6 -4
Original file line number | Diff line number | Diff line change
@@ -34,21 +34,23 @@ done
3434

3535
ROLLOUT_PATH="results/expert_demos/seals_mountain_car/rollouts/final.pkl"
3636
ROLLOUT="(0, None, \"expert\", \"$ROLLOUT_PATH\")"
37+
DRLHP_ROLLOUT_PATH="old_results/rollouts/mountain_car/expert.pkl"
38+
DRLHP_ROLLOUT="(0, None, \"expert\", \"$DRLHP_ROLLOUT_PATH\")"
3739

3840
mkdir -p fig/mountain_car
3941

4042
if [[ $DRLHP == 1 ]]; then
41-
MODEL_PATHS=$(find processed/preference_comparisons -type f -path "*/shaped_mountain_car*_medium*.pt" -printf "%P\n" | sed 's/\.[a-z0-9_]*\.pt$//' | sort | uniq)
43+
MODEL_PATHS=$(find processed/preference_comparisons -type f -path "*/shaped_mountain_car*.pt" -printf "%P\n" | sed 's/\.[a-z0-9_]*\.pt$//' | sort | uniq)
4244
path_list=$(echo $MODEL_PATHS | sed 's/\(\S*\)/"\1",/g')
4345
path_list="[$path_list]"
4446
echo $path_list
4547
for mode in l1 log; do
46-
poetry run python -m reward_preprocessing.plot_reward_curves with \
48+
poetry run python -m reward_preprocessing.plot_drlhp_curves with \
4749
env.mountain_car \
4850
base_path=processed/preference_comparisons \
4951
"model_base_paths=$path_list" \
50-
save_path=fig/mountain_car/preference_comparisons_medium_$mode.pdf \
51-
"rollout_cfg=$ROLLOUT" \
52+
save_path=fig/mountain_car/preference_comparisons_$mode.pdf \
53+
"rollout_cfg=$DRLHP_ROLLOUT" \
5254
$mode
5355
done
5456
fi

setup.cfg

100644 → 100755
File mode changed.

setup.py

100644 → 100755
File mode changed.

src/reward_preprocessing/__init__.py

100644 → 100755
File mode changed.

src/reward_preprocessing/create_densities.py

100644 → 100755
File mode changed.

src/reward_preprocessing/create_models.py

100644 → 100755
File mode changed.

src/reward_preprocessing/create_rollouts.py

100644 → 100755
File mode changed.

src/reward_preprocessing/data.py

100644 → 100755
File mode changed.

src/reward_preprocessing/env/__init__.py

100644 → 100755
File mode changed.

src/reward_preprocessing/env/env_ingredient.py

100644 → 100755
File mode changed.

src/reward_preprocessing/interp/__init__.py

100644 → 100755
File mode changed.

src/reward_preprocessing/interp/fixed_processor.py

100644 → 100755
File mode changed.

src/reward_preprocessing/interp/gridworld_plot.py

100644 → 100755
File mode changed.

src/reward_preprocessing/interp/noise.py

100644 → 100755
File mode changed.

src/reward_preprocessing/interp/optimize.py

100644 → 100755
File mode changed.

src/reward_preprocessing/interp/plot_heatmaps.py

100644 → 100755
File mode changed.

src/reward_preprocessing/interp/plot_rewards.py

100644 → 100755
File mode changed.

src/reward_preprocessing/interp/value_net_shaping.py

100644 → 100755
File mode changed.

src/reward_preprocessing/interpret.py

100644 → 100755
File mode changed.

src/reward_preprocessing/models.py

100644 → 100755
File mode changed.

src/reward_preprocessing/optimize_continuous.py

100644 → 100755
File mode changed.

src/reward_preprocessing/optimize_tabular.py

100644 → 100755
File mode changed.

src/reward_preprocessing/plot_heatmaps.py

100644 → 100755
File mode changed.

src/reward_preprocessing/plot_reward_curves.py

100644 → 100755
File mode changed.

src/reward_preprocessing/policy.py

100644 → 100755
File mode changed.

src/reward_preprocessing/preprocessing/__init__.py

100644 → 100755
File mode changed.

src/reward_preprocessing/preprocessing/fixed_potentials.py

100644 → 100755
File mode changed.

src/reward_preprocessing/preprocessing/potential_shaping.py

100644 → 100755
File mode changed.

src/reward_preprocessing/preprocessing/preprocessor.py

100644 → 100755
File mode changed.

src/reward_preprocessing/types.py

100644 → 100755
File mode changed.

src/reward_preprocessing/utils.py

100644 → 100755
File mode changed.

src/reward_preprocessing/wandb_logger.py

100644 → 100755
File mode changed.

tests/conftest.py

100644 → 100755
File mode changed.

tests/test_envs.py

100644 → 100755
File mode changed.

tests/test_maze.py

100644 → 100755
File mode changed.

tests/test_potential_shaping.py

100644 → 100755
File mode changed.

tests/test_training_pipeline.py

100644 → 100755
File mode changed.

0 commit comments

Comments (0)