mirror of
https://github.com/labmlai/annotated_deep_learning_paper_implementations.git
synced 2025-08-06 15:22:21 +08:00
ppo experiment configs
This commit is contained in:
@ -388,17 +388,7 @@ def main():
|
|||||||
experiment.configs(configs)
|
experiment.configs(configs)
|
||||||
|
|
||||||
# Initialize the trainer
|
# Initialize the trainer
|
||||||
m = Trainer(
|
m = Trainer(**configs)
|
||||||
updates=configs['updates'],
|
|
||||||
epochs=configs['epochs'],
|
|
||||||
n_workers=configs['n_workers'],
|
|
||||||
worker_steps=configs['worker_steps'],
|
|
||||||
batches=configs['batches'],
|
|
||||||
value_loss_coef=configs['value_loss_coef'],
|
|
||||||
entropy_bonus_coef=configs['entropy_bonus_coef'],
|
|
||||||
clip_range=configs['clip_range'],
|
|
||||||
learning_rate=configs['learning_rate'],
|
|
||||||
)
|
|
||||||
|
|
||||||
# Run and monitor the experiment
|
# Run and monitor the experiment
|
||||||
with experiment.start():
|
with experiment.start():
|
||||||
|
2
setup.py
2
setup.py
@ -5,7 +5,7 @@ with open("readme.md", "r") as f:
|
|||||||
|
|
||||||
setuptools.setup(
|
setuptools.setup(
|
||||||
name='labml-nn',
|
name='labml-nn',
|
||||||
version='0.4.114',
|
version='0.4.115',
|
||||||
author="Varuna Jayasiri, Nipun Wijerathne",
|
author="Varuna Jayasiri, Nipun Wijerathne",
|
||||||
author_email="vpjayasiri@gmail.com, hnipun@gmail.com",
|
author_email="vpjayasiri@gmail.com, hnipun@gmail.com",
|
||||||
description="🧑🏫 Implementations/tutorials of deep learning papers with side-by-side notes 📝; including transformers (original, xl, switch, feedback, vit), optimizers (adam, radam, adabelief), gans(dcgan, cyclegan, stylegan2), 🎮 reinforcement learning (ppo, dqn), capsnet, distillation, etc. 🧠",
|
description="🧑🏫 Implementations/tutorials of deep learning papers with side-by-side notes 📝; including transformers (original, xl, switch, feedback, vit), optimizers (adam, radam, adabelief), gans(dcgan, cyclegan, stylegan2), 🎮 reinforcement learning (ppo, dqn), capsnet, distillation, etc. 🧠",
|
||||||
|
Reference in New Issue
Block a user