We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent ae5fce7 commit 33cbc80 (Copy full SHA for 33cbc80)
rl/optimistic_initial_values.py
@@ -9,7 +9,7 @@ class Bandit:
9
def __init__(self, m):
10
self.m = m
11
self.mean = 10
12
- self.N = 0
+ self.N = 1
13
14
def pull(self):
15
return np.random.randn() + self.m
0 commit comments