We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 30b2304 commit 01b8b13 · Copy full SHA for 01b8b13
lib/envs/gridworld.py
@@ -50,7 +50,7 @@ def __init__(self, shape=[4,4]):
50
s = it.iterindex
51
y, x = it.multi_index
52
53
- # P[s][a] = (prob, next_state, reward, done)
+ # P[s][a] = (prob, next_state, reward, is_done)
54
P[s] = {a : [] for a in range(nA)}
55
56
is_done = lambda s: s == 0 or s == (nS - 1)
0 commit comments