Skip to content

Commit cc4c7f5

Browse files
committed
updated config for experiment
1 parent 0efb83c commit cc4c7f5

File tree

2 files changed

+30
-10
lines changed

2 files changed

+30
-10
lines changed

configs/flagrun.json

+10-8
Original file line numberDiff line numberDiff line change
@@ -2,9 +2,9 @@
22
"env": {
33
"name": "AntFlagrunBulletEnv-v0",
44
"max_steps": 500,
5-
"ant_env_rew_weight": 1,
5+
"ant_env_rew_weight": 0,
66
"path_rew_weight": 0,
7-
"dist_rew_weight": 0,
7+
"dist_rew_weight": 1,
88
"goal_reach_rew": 500,
99
"kwargs": {
1010
"enclosed": true,
@@ -13,7 +13,7 @@
1313
"max_target_dist": 4,
1414
"max_targets": 0,
1515
"tolerance": 1,
16-
"switch_flag_on_collision": true,
16+
"switch_flag_on_collision": false,
1717
"use_sensor": true
1818
}
1919
},
@@ -25,8 +25,10 @@
2525
},
2626
"policy": {
2727
"layer_sizes": [
28+
128,
2829
256,
29-
256
30+
256,
31+
128
3032
],
3133
"ac_std": 0.01,
3234
"ac_std_decay": 1,
@@ -46,10 +48,10 @@
4648
"use_pos": false
4749
},
4850
"general": {
49-
"name": "flagrun-local-stupid-sensor",
50-
"gens": 200,
51-
"policies_per_gen": 960,
52-
"eps_per_policy": 100,
51+
"name": "flagrun-sensor-distrew-100timeout",
52+
"gens": 201,
53+
"policies_per_gen": 1200,
54+
"eps_per_policy": 10,
5355
"n_policies": 1,
5456
"batch_size": 500,
5557
"seed": null,

run_saved.py

+20-2
Original file line numberDiff line numberDiff line change
@@ -43,13 +43,31 @@ def run_saved(model: torch.nn.Module, env, steps):
4343
timeout = 200
4444
world_size = 10
4545
enclosed = True
46+
tolerance = 1
47+
steps = 1000
48+
max_target_dist = 4
49+
max_targets = 0
50+
switch_flag_on_collision = False
51+
use_sensor = False
52+
53+
e = gym.make(args.env,
54+
enclosed=enclosed,
55+
timeout=timeout,
56+
size=world_size,
57+
tolerance=tolerance,
58+
max_target_dist=max_target_dist,
59+
max_targets=max_targets,
60+
switch_flag_on_collision=switch_flag_on_collision,
61+
use_sensor=use_sensor,
62+
debug=False).unwrapped
4663

47-
e = gym.make(args.env, enclosed=enclosed, timeout=timeout, size=world_size).unwrapped
4864
e.mpi_common_rand = np.random.RandomState()
65+
AntGatherBulletEnv.ant_env_rew_weight = 1
66+
AntGatherBulletEnv.path_rew_weight = 0
67+
AntGatherBulletEnv.dist_rew_weight = 0
4968

5069
e.render('human')
5170
e.reset()
52-
steps = 1000
5371
if args.record:
5472
e.scene._p.startStateLogging(e.scene._p.STATE_LOGGING_VIDEO_MP4, '~/Documents/es/testvid.mp4')
5573

0 commit comments

Comments
 (0)