From 9e430d2dba85c6da1a2e851e859d079c3fd1b4cc Mon Sep 17 00:00:00 2001 From: Varuna Jayasiri Date: Sat, 2 Oct 2021 13:57:47 +0530 Subject: [PATCH] ppo experiment configs --- labml_nn/rl/ppo/experiment.py | 12 +----------- setup.py | 2 +- 2 files changed, 2 insertions(+), 12 deletions(-) diff --git a/labml_nn/rl/ppo/experiment.py b/labml_nn/rl/ppo/experiment.py index f35702e1..afc17838 100644 --- a/labml_nn/rl/ppo/experiment.py +++ b/labml_nn/rl/ppo/experiment.py @@ -388,17 +388,7 @@ def main(): experiment.configs(configs) # Initialize the trainer - m = Trainer( - updates=configs['updates'], - epochs=configs['epochs'], - n_workers=configs['n_workers'], - worker_steps=configs['worker_steps'], - batches=configs['batches'], - value_loss_coef=configs['value_loss_coef'], - entropy_bonus_coef=configs['entropy_bonus_coef'], - clip_range=configs['clip_range'], - learning_rate=configs['learning_rate'], - ) + m = Trainer(**configs) # Run and monitor the experiment with experiment.start(): diff --git a/setup.py b/setup.py index b99d4e96..2faea44f 100644 --- a/setup.py +++ b/setup.py @@ -5,7 +5,7 @@ with open("readme.md", "r") as f: setuptools.setup( name='labml-nn', - version='0.4.114', + version='0.4.115', author="Varuna Jayasiri, Nipun Wijerathne", author_email="vpjayasiri@gmail.com, hnipun@gmail.com", description="🧑‍🏫 Implementations/tutorials of deep learning papers with side-by-side notes 📝; including transformers (original, xl, switch, feedback, vit), optimizers (adam, radam, adabelief), gans(dcgan, cyclegan, stylegan2), 🎮 reinforcement learning (ppo, dqn), capsnet, distillation, etc. 🧠",