mirror of
https://github.com/labmlai/annotated_deep_learning_paper_implementations.git
synced 2025-11-03 13:57:48 +08:00
dqn experiment link
This commit is contained in:
@ -19,7 +19,7 @@ This is a [PyTorch](https://pytorch.org) implementation of paper
|
||||
Here are the [experiment](experiment.html) and [model](model.html) implementations.
|
||||
|
||||
[Open In Colab](https://colab.research.google.com/github/labmlai/annotated_deep_learning_paper_implementations/blob/master/labml_nn/rl/dqn/experiment.ipynb)
|
||||
[View Run](https://app.labml.ai/run/a0da8048235511ecb9affd797fa27714)
|
||||
[View Run](https://app.labml.ai/run/fe1ad986237511ec86e8b763a2d3f710)
|
||||
"""
|
||||
|
||||
from typing import Tuple
|
||||
|
||||
@ -146,7 +146,7 @@
|
||||
" # Target model updating interval\n",
|
||||
" 'update_target_model': 250,\n",
|
||||
" # Learning rate.\n",
|
||||
" 'learning_rate': FloatDynamicHyperParam(2.5e-4, (0, 1e-3)),\n",
|
||||
" 'learning_rate': FloatDynamicHyperParam(1e-4, (0, 1e-3)),\n",
|
||||
"}"
|
||||
]
|
||||
},
|
||||
|
||||
@ -10,7 +10,7 @@ This experiment trains a Deep Q Network (DQN) to play Atari Breakout game on Ope
|
||||
It runs the [game environments on multiple processes](../game.html) to sample efficiently.
|
||||
|
||||
[Open In Colab](https://colab.research.google.com/github/labmlai/annotated_deep_learning_paper_implementations/blob/master/labml_nn/rl/dqn/experiment.ipynb)
|
||||
[View Run](https://app.labml.ai/run/a0da8048235511ecb9affd797fa27714)
|
||||
[View Run](https://app.labml.ai/run/fe1ad986237511ec86e8b763a2d3f710)
|
||||
"""
|
||||
|
||||
import numpy as np
|
||||
|
||||
@ -7,7 +7,7 @@ summary: Implementation of neural network model for Deep Q Network (DQN).
|
||||
# Deep Q Network (DQN) Model
|
||||
|
||||
[Open In Colab](https://colab.research.google.com/github/labmlai/annotated_deep_learning_paper_implementations/blob/master/labml_nn/rl/dqn/experiment.ipynb)
|
||||
[View Run](https://app.labml.ai/run/a0da8048235511ecb9affd797fa27714)
|
||||
[View Run](https://app.labml.ai/run/fe1ad986237511ec86e8b763a2d3f710)
|
||||
"""
|
||||
|
||||
import torch
|
||||
|
||||
@ -10,7 +10,7 @@ This implements paper [Prioritized experience replay](https://papers.labml.ai/pa
|
||||
using a binary segment tree.
|
||||
|
||||
[Open In Colab](https://colab.research.google.com/github/labmlai/annotated_deep_learning_paper_implementations/blob/master/labml_nn/rl/dqn/experiment.ipynb)
|
||||
[View Run](https://app.labml.ai/run/a0da8048235511ecb9affd797fa27714)
|
||||
[View Run](https://app.labml.ai/run/fe1ad986237511ec86e8b763a2d3f710)
|
||||
"""
|
||||
|
||||
import random
|
||||
|
||||
Reference in New Issue
Block a user