Skip to content

Commit

Permalink
bug fix + tqdm on benchmark
Browse files Browse the repository at this point in the history
  • Loading branch information
mcpeixoto committed Jun 10, 2023
1 parent 054e74d commit a332c30
Showing 1 changed file with 3 additions and 2 deletions.
5 changes: 3 additions & 2 deletions CardPole_DNN.py
Original file line number Diff line number Diff line change
Expand Up @@ -15,6 +15,7 @@
import os
from os.path import join, exists
import warnings
from tqdm import tqdm
warnings.filterwarnings("ignore")


Expand Down Expand Up @@ -212,7 +213,7 @@ def main(n_layers, seed, batch_size = 16, lr = 0.001, n_episodes = 5000,
episode_reward_history.append(episode_reward) # Add Episode Reward to History


def benchmark(n_layers, seed, batch_size = 16, lr = 0.001, n_episodes = 5000,
def benchmark(n_layers, seed, batch_size = 16, lr = 0.001, n_episodes = 100,
max_steps = 500, gamma = 0.99, epsilon_start = 1, epsilon_decay = 0.99,
epsilon_min = 0.01, buffer_size = 10000, target_update_freq = None,
online_train_freq = None, win_thr = 100, done = False, win = False,
Expand All @@ -231,7 +232,7 @@ def benchmark(n_layers, seed, batch_size = 16, lr = 0.001, n_episodes = 5000,
rewards_over_episodes = []

observation = env.reset()
for episode in range(n_episodes):
for episode in tqdm(range(n_episodes)):
curr_epsisode_rewards = []

state = env.reset()
Expand Down

0 comments on commit a332c30

Please sign in to comment.