diff --git a/.gitignore b/.gitignore index 9619c610..c82e990f 100644 --- a/.gitignore +++ b/.gitignore @@ -12,4 +12,5 @@ labml_helpers labml_samples data logs -html/ \ No newline at end of file +html/ +diagrams/ \ No newline at end of file diff --git a/Makefile b/Makefile index ab61b2d8..e6c25a42 100644 --- a/Makefile +++ b/Makefile @@ -23,14 +23,11 @@ uninstall: ## Uninstall docs: ## Render annotated HTML find ./docs/ -name "*.html" -type f -delete + find ./docs/ -name "*.svg" -type f -delete python utils/sitemap.py + python utils/diagrams.py cd labml_nn; pylit --remove_empty_sections --title_md -t ../../../pylit/templates/nn -d ../docs -w * -pages-old: ## Copy to lab-ml site - cd labml_nn; pylit --remove_empty_sections --title_md -t ../../../pylit/templates/nn_old -d ../html/labml_nn * - @cd ../pages; git pull - cp -r html/* ../pages/ - help: ## Show this help. @fgrep -h "##" $(MAKEFILE_LIST) | fgrep -v fgrep | sed -e 's/\\$$//' | sed -e 's/##//' diff --git a/docs/activations/index.html b/docs/activations/index.html index 8e818fcf..560b440f 100644 --- a/docs/activations/index.html +++ b/docs/activations/index.html @@ -95,19 +95,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/activations/swish.html b/docs/activations/swish.html index eb7cbe84..123ea8ee 100644 --- a/docs/activations/swish.html +++ b/docs/activations/swish.html @@ -134,19 +134,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/capsule_networks/index.html b/docs/capsule_networks/index.html index 84cb2c05..9db61c64 100644 --- a/docs/capsule_networks/index.html +++ b/docs/capsule_networks/index.html @@ -465,19 +465,46 @@ of $\mathcal{L}_k$ for for all $k$.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/capsule_networks/mnist.html b/docs/capsule_networks/mnist.html index 42ff668a..f01d20d0 100644 --- a/docs/capsule_networks/mnist.html +++ b/docs/capsule_networks/mnist.html @@ -549,19 +549,46 @@ take it through decoder to get reconstruction

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/capsule_networks/readme.html b/docs/capsule_networks/readme.html index 7cb46a86..ceed2e82 100644 --- a/docs/capsule_networks/readme.html +++ b/docs/capsule_networks/readme.html @@ -108,19 +108,46 @@ confusions I had with the paper.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/cnn/cnn_visualization.html b/docs/cnn/cnn_visualization.html index ac0ead78..ea5574ac 100644 --- a/docs/cnn/cnn_visualization.html +++ b/docs/cnn/cnn_visualization.html @@ -454,19 +454,46 @@ plt.imshow(sobel_h(act[0][idx-1]), cmap=plt.cm.gray)

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/cnn/cross_validation.html b/docs/cnn/cross_validation.html index 9215c235..d238c069 100644 --- a/docs/cnn/cross_validation.html +++ b/docs/cnn/cross_validation.html @@ -246,19 +246,46 @@ from nutsml import *

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/cnn/models/cnn.html b/docs/cnn/models/cnn.html index 42c07de8..7c7dd2e1 100644 --- a/docs/cnn/models/cnn.html +++ b/docs/cnn/models/cnn.html @@ -479,19 +479,46 @@ Calculate the output shape after applying a convolution

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/cnn/ray_tune.html b/docs/cnn/ray_tune.html index 51dc8d5e..f842fe6c 100644 --- a/docs/cnn/ray_tune.html +++ b/docs/cnn/ray_tune.html @@ -273,19 +273,46 @@ ASHA (Asynchronous Successive Halving Algorithm) scheduler displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/cnn/utils/cv_train.html b/docs/cnn/utils/cv_train.html index 1bba00d4..7c854827 100644 --- a/docs/cnn/utils/cv_train.html +++ b/docs/cnn/utils/cv_train.html @@ -500,19 +500,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/cnn/utils/dataloader.html b/docs/cnn/utils/dataloader.html index d47437df..622535dd 100644 --- a/docs/cnn/utils/dataloader.html +++ b/docs/cnn/utils/dataloader.html @@ -313,19 +313,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/cnn/utils/train.html b/docs/cnn/utils/train.html index f967270e..93cf1412 100644 --- a/docs/cnn/utils/train.html +++ b/docs/cnn/utils/train.html @@ -552,19 +552,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/experiments/cifar10.html b/docs/experiments/cifar10.html index a9a45378..6e1a0e15 100644 --- a/docs/experiments/cifar10.html +++ b/docs/experiments/cifar10.html @@ -108,19 +108,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/experiments/index.html b/docs/experiments/index.html index b5799458..f1b1177c 100644 --- a/docs/experiments/index.html +++ b/docs/experiments/index.html @@ -84,19 +84,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/experiments/mnist.html b/docs/experiments/mnist.html index b393f096..96d47fbd 100644 --- a/docs/experiments/mnist.html +++ b/docs/experiments/mnist.html @@ -416,19 +416,46 @@ This will keep the accuracy metric stats separate for training and validation. + \ No newline at end of file diff --git a/docs/experiments/nlp_autoregression.html b/docs/experiments/nlp_autoregression.html index 50542f7e..43b06a1f 100644 --- a/docs/experiments/nlp_autoregression.html +++ b/docs/experiments/nlp_autoregression.html @@ -965,19 +965,46 @@ We need to transpose it to be sequence first.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/gan/cycle_gan/index.html b/docs/gan/cycle_gan/index.html index 3fb584f1..37cd1ef5 100644 --- a/docs/gan/cycle_gan/index.html +++ b/docs/gan/cycle_gan/index.html @@ -1940,19 +1940,46 @@ in the call to experiment.configs

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/gan/cycle_gan/readme.html b/docs/gan/cycle_gan/readme.html index b288e2a9..a6c1f8c9 100644 --- a/docs/gan/cycle_gan/readme.html +++ b/docs/gan/cycle_gan/readme.html @@ -98,19 +98,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/gan/dcgan/index.html b/docs/gan/dcgan/index.html index 12f0ef33..1f9c0f37 100644 --- a/docs/gan/dcgan/index.html +++ b/docs/gan/dcgan/index.html @@ -370,19 +370,46 @@ generator and discriminator networks

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/gan/dcgan/readme.html b/docs/gan/dcgan/readme.html index 07410ed2..b85d9be6 100644 --- a/docs/gan/dcgan/readme.html +++ b/docs/gan/dcgan/readme.html @@ -98,19 +98,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/gan/index.html b/docs/gan/index.html index 45cccd83..22423086 100644 --- a/docs/gan/index.html +++ b/docs/gan/index.html @@ -102,19 +102,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/gan/original/experiment.html b/docs/gan/original/experiment.html index 33469fd0..4eef9668 100644 --- a/docs/gan/original/experiment.html +++ b/docs/gan/original/experiment.html @@ -599,19 +599,46 @@ Default of 0.9 fails.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/gan/original/index.html b/docs/gan/original/index.html index 6944be4d..ba8bef6f 100644 --- a/docs/gan/original/index.html +++ b/docs/gan/original/index.html @@ -309,19 +309,46 @@ the above gradient.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/gan/original/readme.html b/docs/gan/original/readme.html index 08587a98..46bfeb4e 100644 --- a/docs/gan/original/readme.html +++ b/docs/gan/original/readme.html @@ -98,19 +98,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/gan/stylegan/discriminator_block.svg b/docs/gan/stylegan/discriminator_block.svg new file mode 100644 index 00000000..f9ed820b --- /dev/null +++ b/docs/gan/stylegan/discriminator_block.svg @@ -0,0 +1,85 @@ +
Downsample
Downsample
3x3 Conv
3x3 Conv
3x3 Conv
3x3 Conv
Downsample
Downsample
1x1 Conv
1x1 Conv
+
+
Viewer does not support full SVG 1.1
\ No newline at end of file diff --git a/docs/gan/stylegan/experiment.html b/docs/gan/stylegan/experiment.html new file mode 100644 index 00000000..2a7ad67b --- /dev/null +++ b/docs/gan/stylegan/experiment.html @@ -0,0 +1,1663 @@ + + + + + + + + + + + + + + + + + + + + + + + Style GAN 2 Model Training + + + + + + + + +
+
+
+
+

+ home + gan + stylegan +

+

+ + + Github + + Join Slack + + Twitter +

+
+
+
+
+ +

Style GAN 2 Model Training

+

This is the training code for the Style GAN 2 model.

+

Generated Images

+

These are $64 \times 64$ images generated after training for about 80K steps.

+

Our implementation is a minimalistic Style GAN2 model training code. Only single-GPU training is supported to keep the implementation simple. We managed to keep it under 500 lines of code, including the training loop.

+

Without DDP (distributed data parallel) and multi-GPU training it will not be possible to train the model at large resolutions (128+). If you want training code with fp16 and DDP, take a look at lucidrains/stylegan2-pytorch.

+

We trained this on the CelebA-HQ dataset. You can find the download instructions in this discussion on fast.ai. Save the images inside the data/stylegan folder.

+
+
+
31import math
+32from pathlib import Path
+33from typing import Iterator, Tuple
+34
+35import torch
+36import torch.utils.data
+37import torchvision
+38from PIL import Image
+39
+40from labml import tracker, lab, monit, experiment
+41from labml.configs import BaseConfigs
+42from labml_helpers.device import DeviceConfigs
+43from labml_helpers.train_valid import ModeState, hook_model_outputs
+44from labml_nn.gan.stylegan import Discriminator, Generator, MappingNetwork, GradientPenalty, PathLengthPenalty
+45from labml_nn.gan.wasserstein import DiscriminatorLoss, GeneratorLoss
+46from labml_nn.utils import cycle_dataloader
+
+
+
+
+ +

Dataset

+

This loads the training dataset and resizes it to the given image size.

+
+
+
49class Dataset(torch.utils.data.Dataset):
+
+
+
+
+ +
    +
  • path path to the folder containing the images
  • +
  • image_size size of the image
  • +
+
+
+
56    def __init__(self, path: str, image_size: int):
+
+
+
+
+ + +
+
+
61        super().__init__()
+
+
+
+
+ +

Get the paths of all jpg files

+
+
+
64        self.paths = [p for p in Path(path).glob(f'**/*.jpg')]
+
+
+
+
+ +

Transformation

+
+
+
67        self.transform = torchvision.transforms.Compose([
+
+
+
+
+ +

Resize the image

+
+
+
69            torchvision.transforms.Resize(image_size),
+
+
+
+
+ +

Convert to PyTorch tensor

+
+
+
71            torchvision.transforms.ToTensor(),
+72        ])
+
+
+
+
+ +

Number of images

+
+
+
74    def __len__(self):
+
+
+
+
+ + +
+
+
76        return len(self.paths)
+
+
+
+
+ +

Get the index-th image

+
+
+
78    def __getitem__(self, index):
+
+
+
+
+ + +
+
+
80        path = self.paths[index]
+81        img = Image.open(path)
+82        return self.transform(img)
+
+
+
+
+ +

Configurations

+
+
+
85class Configs(BaseConfigs):
+
+
+
+
+ +

Device to train the model on. +DeviceConfigs + picks up an available CUDA device or defaults to CPU.

+
+
+
93    device: torch.device = DeviceConfigs()
+
+
+
+ +
+
96    discriminator: Discriminator
+
+
+
+ +
+
98    generator: Generator
+
+
+
+
+ +

Mapping network

+
+
+
100    mapping_network: MappingNetwork
+
+
+
+
+ +

Discriminator and generator loss functions. +We use Wasserstein loss

+
+
+
104    discriminator_loss: DiscriminatorLoss
+105    generator_loss: GeneratorLoss
+
+
+
+
+ +

Optimizers

+
+
+
108    generator_optimizer: torch.optim.Adam
+109    discriminator_optimizer: torch.optim.Adam
+110    mapping_network_optimizer: torch.optim.Adam
+
+
+
+ +
+
113    gradient_penalty = GradientPenalty()
+
+
+
+
+ +

Gradient penalty coefficient $\gamma$

+
+
+
115    gradient_penalty_coefficient: float = 10.
+
+
+
+ +
+
118    path_length_penalty: PathLengthPenalty
+
+
+
+
+ +

Data loader

+
+
+
121    loader: Iterator
+
+
+
+
+ +

Batch size

+
+
+
124    batch_size: int = 32
+
+
+
+
+ +

Dimensionality of $z$ and $w$

+
+
+
126    d_latent: int = 512
+
+
+
+
+ +

Height/width of the image

+
+
+
128    image_size: int = 32
+
+
+
+
+ +

Number of layers in the mapping network

+
+
+
130    mapping_network_layers: int = 8
+
+
+
+
+ +

Generator & Discriminator learning rate

+
+
+
132    learning_rate: float = 1e-3
+
+
+
+
+ +

Mapping network learning rate ($100 \times$ lower than the others)

+
+
+
134    mapping_network_learning_rate: float = 1e-5
+
+
+
+
+ +

Number of steps to accumulate gradients on. Use this to increase the effective batch size.

+
+
+
136    gradient_accumulate_steps: int = 1
+
+
+
+
+ +

$\beta_1$ and $\beta_2$ for Adam optimizer

+
+
+
138    adam_betas: Tuple[float, float] = (0.0, 0.99)
+
+
+
+
+ +

Probability of mixing styles

+
+
+
140    style_mixing_prob: float = 0.9
+
+
+
+
+ +

Total number of training steps

+
+
+
143    training_steps: int = 150_000
+
+
+
+
+ +

Number of blocks in the generator (calculated based on image resolution)

+
+
+
146    n_gen_blocks: int
+
+
+
+
+ +

Lazy regularization

+

Instead of calculating the regularization losses, the paper proposes lazy regularization +where the regularization terms are calculated once in a while. +This improves the training efficiency a lot.
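As a rough sketch (the helper name below is ours, for illustration only; the real logic lives in the step function further down), the penalty is computed only every few steps and scaled up by the interval so its average contribution stays the same:

```python
def lazy_penalty_weight(step: int, interval: int, coefficient: float) -> float:
    """Return the weight to apply to a regularization term at this step.

    The expensive penalty is only computed every `interval` steps, so it is
    multiplied by `interval` to keep its time-averaged contribution unchanged.
    """
    if (step + 1) % interval == 0:
        return coefficient * interval
    return 0.0
```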

+
+
+
+
+
+
+
+ +

The interval at which to compute gradient penalty

+
+
+
154    lazy_gradient_penalty_interval: int = 4
+
+
+
+
+ +

Path length penalty calculation interval

+
+
+
156    lazy_path_penalty_interval: int = 32
+
+
+
+
+ +

Skip calculating path length penalty during the initial phase of training

+
+
+
158    lazy_path_penalty_after: int = 5_000
+
+
+
+
+ +

How often to log generated images

+
+
+
161    log_generated_interval: int = 500
+
+
+
+
+ +

How often to save model checkpoints

+
+
+
163    save_checkpoint_interval: int = 2_000
+
+
+
+
+ +

Training mode state for logging activations

+
+
+
166    mode: ModeState
+
+
+
+
+ +

Whether to log model layer outputs

+
+
+
168    log_layer_outputs: bool = False
+
+
+
+
+ +

We trained this on the CelebA-HQ dataset. You can find the download instructions in this discussion on fast.ai. Save the images inside the data/stylegan folder.

+
+
+
175    dataset_path: str = str(lab.get_data_path() / 'stylegan2')
+
+
+
+
+ +

Initialize

+
+
+
177    def init(self):
+
+
+
+
+ +

Create dataset

+
+
+
182        dataset = Dataset(self.dataset_path, self.image_size)
+
+
+
+
+ +

Create data loader

+
+
+
184        dataloader = torch.utils.data.DataLoader(dataset, batch_size=self.batch_size, num_workers=32,
+185                                                 shuffle=True, drop_last=True, pin_memory=True)
+
+
+
+
+ +

Continuous cyclic loader

+
+
+
187        self.loader = cycle_dataloader(dataloader)
+
+
+
+
+ +

$\log_2$ of image resolution

+
+
+
190        log_resolution = int(math.log2(self.image_size))
+
+
+
+
+ +

Create discriminator and generator

+
+
+
193        self.discriminator = Discriminator(log_resolution).to(self.device)
+194        self.generator = Generator(log_resolution, self.d_latent).to(self.device)
+
+
+
+
+ +

Get number of generator blocks for creating style and noise inputs

+
+
+
196        self.n_gen_blocks = self.generator.n_blocks
+
+
+
+
+ +

Create mapping network

+
+
+
198        self.mapping_network = MappingNetwork(self.d_latent, self.mapping_network_layers).to(self.device)
+
+
+
+
+ +

Create path length penalty loss

+
+
+
200        self.path_length_penalty = PathLengthPenalty(0.99).to(self.device)
+
+
+
+
+ +

Add model hooks to monitor layer outputs

+
+
+
203        if self.log_layer_outputs:
+204            hook_model_outputs(self.mode, self.discriminator, 'discriminator')
+205            hook_model_outputs(self.mode, self.generator, 'generator')
+206            hook_model_outputs(self.mode, self.mapping_network, 'mapping_network')
+
+
+
+
+ +

Discriminator and generator losses

+
+
+
209        self.discriminator_loss = DiscriminatorLoss().to(self.device)
+210        self.generator_loss = GeneratorLoss().to(self.device)
+
+
+
+
+ +

Create optimizers

+
+
+
213        self.discriminator_optimizer = torch.optim.Adam(
+214            self.discriminator.parameters(),
+215            lr=self.learning_rate, betas=self.adam_betas
+216        )
+217        self.generator_optimizer = torch.optim.Adam(
+218            self.generator.parameters(),
+219            lr=self.learning_rate, betas=self.adam_betas
+220        )
+221        self.mapping_network_optimizer = torch.optim.Adam(
+222            self.mapping_network.parameters(),
+223            lr=self.mapping_network_learning_rate, betas=self.adam_betas
+224        )
+
+
+
+
+ +

Set tracker configurations

+
+
+
227        tracker.set_image("generated", True)
+
+
+
+
+ +

Sample $w$

+

This samples $z$ randomly and gets $w$ from the mapping network.

+

We also apply style mixing sometimes where we generate two latent variables +$z_1$ and $z_2$ and get corresponding $w_1$ and $w_2$. +Then we randomly sample a cross-over point and apply $w_1$ to +the generator blocks before the cross-over point and +$w_2$ to the blocks after.

+
+
+
229    def get_w(self, batch_size: int):
+
+
+
+
+ +

Mix styles

+
+
+
243        if torch.rand(()).item() < self.style_mixing_prob:
+
+
+
+
+ +

Random cross-over point

+
+
+
245            cross_over_point = int(torch.rand(()).item() * self.n_gen_blocks)
+
+
+
+
+ +

Sample $z_1$ and $z_2$

+
+
+
247            z2 = torch.randn(batch_size, self.d_latent).to(self.device)
+248            z1 = torch.randn(batch_size, self.d_latent).to(self.device)
+
+
+
+
+ +

Get $w_1$ and $w_2$

+
+
+
250            w1 = self.mapping_network(z1)
+251            w2 = self.mapping_network(z2)
+
+
+
+
+ +

Expand $w_1$ and $w_2$ for the generator blocks and concatenate

+
+
+
253            w1 = w1[None, :, :].expand(cross_over_point, -1, -1)
+254            w2 = w2[None, :, :].expand(self.n_gen_blocks - cross_over_point, -1, -1)
+255            return torch.cat((w1, w2), dim=0)
+
+
+
+
+ +

Without mixing

+
+
+
257        else:
+
+
+
+
+ +

Sample $z$

+
+
+
259            z = torch.randn(batch_size, self.d_latent).to(self.device)
+
+
+
+
+ +

Get $w$

+
+
+
261            w = self.mapping_network(z)
+
+
+
+
+ +

Expand $w$ for the generator blocks

+
+
+
263            return w[None, :, :].expand(self.n_gen_blocks, -1, -1)
+
+
+
+
+ +

Generate noise

+

This generates noise for each generator block

+
+
+
265    def get_noise(self, batch_size: int):
+
+
+
+
+ +

List to store noise

+
+
+
272        noise = []
+
+
+
+
+ +

Noise resolution starts from $4$

+
+
+
274        resolution = 4
+
+
+
+
+ +

Generate noise for each generator block

+
+
+
277        for i in range(self.n_gen_blocks):
+
+
+
+
+ +

The first block has only one $3 \times 3$ convolution

+
+
+
279            if i == 0:
+280                n1 = None
+
+
+
+
+ +

Generate noise to add after the first convolution layer

+
+
+
282            else:
+283                n1 = torch.randn(batch_size, 1, resolution, resolution, device=self.device)
+
+
+
+
+ +

Generate noise to add after the second convolution layer

+
+
+
285            n2 = torch.randn(batch_size, 1, resolution, resolution, device=self.device)
+
+
+
+
+ +

Add noise tensors to the list

+
+
+
288            noise.append((n1, n2))
+
+
+
+
+ +

Next block has $2 \times$ resolution

+
+
+
291            resolution *= 2
+
+
+
+
+ +

Return noise tensors

+
+
+
294        return noise
+
+
+
+
+ +

Generate images

+

This generates images using the generator

+
+
+
296    def generate_images(self, batch_size: int):
+
+
+
+
+ +

Get $w$

+
+
+
304        w = self.get_w(batch_size)
+
+
+
+
+ +

Get noise

+
+
+
306        noise = self.get_noise(batch_size)
+
+
+
+
+ +

Generate images

+
+
+
309        images = self.generator(w, noise)
+
+
+
+
+ +

Return images and $w$

+
+
+
312        return images, w
+
+
+
+
+ +

Training Step

+
+
+
314    def step(self, idx: int):
+
+
+
+
+ +

Train the discriminator

+
+
+
320        with monit.section('Discriminator'):
+
+
+
+
+ +

Reset gradients

+
+
+
322            self.discriminator_optimizer.zero_grad()
+
+
+
+
+ +

Accumulate gradients for gradient_accumulate_steps

+
+
+
325            for i in range(self.gradient_accumulate_steps):
+
+
+
+
+ +

Update mode. Set whether to log activation

+
+
+
327                with self.mode.update(is_log_activations=(idx + 1) % self.log_generated_interval == 0):
+
+
+
+
+ +

Sample images from generator

+
+
+
329                    generated_images, _ = self.generate_images(self.batch_size)
+
+
+
+
+ +

Discriminator classification for generated images

+
+
+
331                    fake_output = self.discriminator(generated_images.detach())
+
+
+
+
+ +

Get real images from the data loader

+
+
+
334                    real_images = next(self.loader).to(self.device)
+
+
+
+
+ +

We need to calculate gradients w.r.t. real images for gradient penalty

+
+
+
336                    if (idx + 1) % self.lazy_gradient_penalty_interval == 0:
+337                        real_images.requires_grad_()
+
+
+
+
+ +

Discriminator classification for real images

+
+
+
339                    real_output = self.discriminator(real_images)
+
+
+
+
+ +

Get discriminator loss

+
+
+
342                    real_loss, fake_loss = self.discriminator_loss(real_output, fake_output)
+343                    disc_loss = real_loss + fake_loss
+
+
+
+
+ +

Add gradient penalty

+
+
+
346                    if (idx + 1) % self.lazy_gradient_penalty_interval == 0:
+
+
+
+
+ +

Calculate and log gradient penalty

+
+
+
348                        gp = self.gradient_penalty(real_images, real_output)
+349                        tracker.add('loss.gp', gp)
+
+
+
+
+ +

Multiply by coefficient and add gradient penalty

+
+
+
351                        disc_loss = disc_loss + 0.5 * self.gradient_penalty_coefficient * gp * self.lazy_gradient_penalty_interval
+
+
+
+
+ +

Compute gradients

+
+
+
354                    disc_loss.backward()
+
+
+
+
+ +

Log discriminator loss

+
+
+
357                    tracker.add('loss.discriminator', disc_loss)
+358
+359            if (idx + 1) % self.log_generated_interval == 0:
+
+
+
+
+ +

Log discriminator model parameters occasionally

+
+
+
361                tracker.add('discriminator', self.discriminator)
+
+
+
+
+ +

Clip gradients for stabilization

+
+
+
364            torch.nn.utils.clip_grad_norm_(self.discriminator.parameters(), max_norm=1.0)
+
+
+
+
+ +

Take optimizer step

+
+
+
366            self.discriminator_optimizer.step()
+
+
+
+
+ +

Train the generator

+
+
+
369        with monit.section('Generator'):
+
+
+
+
+ +

Reset gradients

+
+
+
371            self.generator_optimizer.zero_grad()
+372            self.mapping_network_optimizer.zero_grad()
+
+
+
+
+ +

Accumulate gradients for gradient_accumulate_steps

+
+
+
375            for i in range(self.gradient_accumulate_steps):
+
+
+
+
+ +

Sample images from generator

+
+
+
377                generated_images, w = self.generate_images(self.batch_size)
+
+
+
+
+ +

Discriminator classification for generated images

+
+
+
379                fake_output = self.discriminator(generated_images)
+
+
+
+
+ +

Get generator loss

+
+
+
382                gen_loss = self.generator_loss(fake_output)
+
+
+
+
+ +

Add path length penalty

+
+
+
385                if idx > self.lazy_path_penalty_after and (idx + 1) % self.lazy_path_penalty_interval == 0:
+
+
+
+
+ +

Calculate path length penalty

+
+
+
387                    plp = self.path_length_penalty(w, generated_images)
+
+
+
+
+ +

Ignore if nan

+
+
+
389                    if not torch.isnan(plp):
+390                        tracker.add('loss.plp', plp)
+391                        gen_loss = gen_loss + plp
+
+
+
+
+ +

Calculate gradients

+
+
+
394                gen_loss.backward()
+
+
+
+
+ +

Log generator loss

+
+
+
397                tracker.add('loss.generator', gen_loss)
+398
+399            if (idx + 1) % self.log_generated_interval == 0:
+
+
+
+
+ +

Log generator and mapping network model parameters occasionally

+
+
+
401                tracker.add('generator', self.generator)
+402                tracker.add('mapping_network', self.mapping_network)
+
+
+
+
+ +

Clip gradients for stabilization

+
+
+
405            torch.nn.utils.clip_grad_norm_(self.generator.parameters(), max_norm=1.0)
+406            torch.nn.utils.clip_grad_norm_(self.mapping_network.parameters(), max_norm=1.0)
+
+
+
+
+ +

Take optimizer step

+
+
+
409            self.generator_optimizer.step()
+410            self.mapping_network_optimizer.step()
+
+
+
+
+ +

Log generated images

+
+
+
413        if (idx + 1) % self.log_generated_interval == 0:
+414            tracker.add('generated', torch.cat([generated_images[:6], real_images[:3]], dim=0))
+
+
+
+
+ +

Save model checkpoints

+
+
+
416        if (idx + 1) % self.save_checkpoint_interval == 0:
+417            experiment.save_checkpoint()
+
+
+
+
+ +

Flush tracker

+
+
+
420        tracker.save()
+
+
+
+
+ +

Train model

+
+
+
422    def train(self):
+
+
+
+
+ +

Loop for training_steps

+
+
+
428        for i in monit.loop(self.training_steps):
+
+
+
+
+ +

Take a training step

+
+
+
430            self.step(i)
+
+
+
+
+ + +
+
+
432            if (i + 1) % self.log_generated_interval == 0:
+433                tracker.new_line()
+
+
+
+
+ +

Train StyleGAN2

+
+
+
436def main():
+
+
+
+
+ +

Create an experiment

+
+
+
442    experiment.create(name='stylegan2')
+
+
+
+
+ +

Create configurations object

+
+
+
444    configs = Configs()
+
+
+
+
+ +

Set configurations and override some

+
+
+
447    experiment.configs(configs, {
+448        'device.cuda_device': 0,
+449        'image_size': 64,
+450        'log_generated_interval': 200
+451    })
+
+
+
+
+ +

Initialize

+
+
+
454    configs.init()
+
+
+
+
+ +

Set models for saving and loading

+
+
+
456    experiment.add_pytorch_models(mapping_network=configs.mapping_network,
+457                                  generator=configs.generator,
+458                                  discriminator=configs.discriminator)
+
+
+
+
+ +

Start the experiment

+
+
+
461    with experiment.start():
+
+
+
+
+ +

Run the training loop

+
+
+
463        configs.train()
+
+
+
+
+ + +
+
+
466if __name__ == '__main__':
+467    main()
+
+
+
+ + + + + + + \ No newline at end of file diff --git a/docs/gan/stylegan/generated_64.png b/docs/gan/stylegan/generated_64.png new file mode 100644 index 00000000..d57a3f2c Binary files /dev/null and b/docs/gan/stylegan/generated_64.png differ diff --git a/docs/gan/stylegan/generator_block.svg b/docs/gan/stylegan/generator_block.svg new file mode 100644 index 00000000..23c1c3ed --- /dev/null +++ b/docs/gan/stylegan/generator_block.svg @@ -0,0 +1,85 @@ +
3X3 Conv
3X3 Conv
+
+
B
B
A
A
Demod
Demod
Mod
Mod
weights
weights
3X3 Conv
3X3 Conv
+
+
B
B
A
A
Demod
Demod
Mod
Mod
weights
weights
bias
bias
bias
bias
+
+
toRGB
toRGB
feature map
featur...
rgb
rgb
Viewer does not support full SVG 1.1
\ No newline at end of file diff --git a/docs/gan/stylegan/index.html b/docs/gan/stylegan/index.html new file mode 100644 index 00000000..83eae8b1 --- /dev/null +++ b/docs/gan/stylegan/index.html @@ -0,0 +1,2685 @@ + + + + + + + + + + + + + + + + + + + + + + + Style GAN 2 + + + + + + + + +
+
+
+
+

+ home + gan + stylegan +

+

+ + + Github + + Join Slack + + Twitter +

+
+
+
+
+ +

Style GAN 2

+

This is a PyTorch implementation of the paper Analyzing and Improving the Image Quality of StyleGAN, which introduces Style GAN2. Style GAN2 is an improvement over Style GAN from the paper A Style-Based Generator Architecture for Generative Adversarial Networks. And Style GAN is based on Progressive GAN from the paper Progressive Growing of GANs for Improved Quality, Stability, and Variation. All three papers are by the same authors at NVIDIA AI.

+

Our implementation is a minimalistic Style GAN2 model training code. Only single-GPU training is supported to keep the implementation simple. We managed to keep it under 500 lines of code, including the training loop.

+

🏃 Here’s the training code: experiment.py.

+

Generated Images

+

These are $64 \times 64$ images generated after training for about 80K steps.

+

We’ll first introduce the three papers at a high level.

+

Generative Adversarial Networks

+

Generative adversarial networks have two components; the generator and the discriminator. +The generator network takes a random latent vector ($z \in \mathcal{Z}$) + and tries to generate a realistic image. +The discriminator network tries to differentiate the real images from generated images. +When we train the two networks together the generator starts generating images indistinguishable from real images.
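For reference (not specific to this implementation, which uses Wasserstein loss instead), the original GAN training objective is the minimax game
$$\min_G \max_D \; \mathbb{E}_{x \sim p_{\text{data}}}\big[\log D(x)\big] + \mathbb{E}_{z \sim p(z)}\big[\log\big(1 - D(G(z))\big)\big]$$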

+

Progressive GAN

+

Progressive GAN generates high-resolution images (of size $1080 \times 1080$). It does so by progressively increasing the image size. First, it trains a network that produces a $4 \times 4$ image, then $8 \times 8$, then a $16 \times 16$ image, and so on up to the desired image resolution.

+

At each resolution, the generator network produces an image in latent space which is converted into RGB, +with a $1 \times 1$ convolution. +When we progress from a lower resolution to a higher resolution + (say from $4 \times 4$ to $8 \times 8$ ) we scale the latent image by $2\times$ + and add a new block (two $3 \times 3$ convolution layers) + and a new $1 \times 1$ layer to get RGB. +The transition is done smoothly by adding a residual connection to + the $2\times$ scaled $4 \times 4$ RGB image. +The weight of this residual connection is slowly reduced, to let the new block take over.
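Here is a minimal sketch of that smooth transition (our own illustration with assumed names; StyleGAN2 below does not use progressive growing, so nothing like this appears in the implementation):

```python
import torch
import torch.nn.functional as F

def fade_in(alpha: float, old_rgb: torch.Tensor, new_rgb: torch.Tensor) -> torch.Tensor:
    """Blend the up-scaled RGB output of the previous resolution with the new block's RGB.

    `alpha` grows from 0 to 1 during the transition, slowly letting the new block take over.
    """
    # Up-sample the old RGB image to the new resolution (e.g. 4x4 -> 8x8)
    old_up = F.interpolate(old_rgb, scale_factor=2, mode='nearest')
    # Residual connection whose weight decays as alpha goes to 1
    return (1. - alpha) * old_up + alpha * new_rgb
```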

+

The discriminator is a mirror image of the generator network. +The progressive growth of the discriminator is done similarly.

+

progressive_gan.svg

+

$2\times$ and $0.5\times$ denote feature map resolution scaling up and down. $4\times 4$, $8\times 8$, … denote the feature map resolution at the generator or discriminator block. Each discriminator and generator block consists of 2 convolution layers with leaky ReLU activations.

+

They use minibatch standard deviation to increase variation and equalized learning rate, which we discuss below in the implementation. They also use pixel-wise normalization, where the feature vector at each pixel is normalized. They apply this to all the convolution layer outputs (except RGB).
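For illustration (our own sketch; pixel-wise normalization is a Progressive GAN detail and is not used in the StyleGAN2 code below), pixel-wise normalization normalizes the feature vector at every spatial position:

```python
import torch

def pixel_norm(x: torch.Tensor, eps: float = 1e-8) -> torch.Tensor:
    """Normalize the feature vector at each pixel of a [batch, channels, height, width] map."""
    return x * torch.rsqrt(x.pow(2).mean(dim=1, keepdim=True) + eps)
```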

+

Style GAN

+

Style GAN improves the generator of Progressive GAN while keeping the discriminator architecture the same.

+

Mapping Network

+

It maps the random latent vector ($z \in \mathcal{Z}$) + into a different latent space ($w \in \mathcal{W}$), + with an 8-layer neural network. +This gives an intermediate latent space $\mathcal{W}$ +where the factors of variations are more linear (disentangled).

+

AdaIN

+

Then $w$ is transformed into two vectors (styles) per layer $i$, $y_i = (y_{s,i}, y_{b,i}) = f_{A_i}(w)$, and used for scaling and shifting (biasing) in each layer with the $\text{AdaIN}$ operator (normalize and scale): $$\text{AdaIN}(x_i, y_i) = y_{s,i} \frac{x_i - \mu(x_i)}{\sigma(x_i)} + y_{b,i}$$
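A small sketch of the $\text{AdaIN}$ operation (our own illustration; StyleGAN2 below replaces this with weight modulation):

```python
import torch

def adain(x: torch.Tensor, y_s: torch.Tensor, y_b: torch.Tensor, eps: float = 1e-5) -> torch.Tensor:
    """Normalize each feature map of x ([batch, channels, height, width]) per sample,
    then scale by the style y_s and shift by the style bias y_b (both [batch, channels])."""
    mean = x.mean(dim=(2, 3), keepdim=True)
    std = x.std(dim=(2, 3), keepdim=True)
    x_hat = (x - mean) / (std + eps)
    return y_s[:, :, None, None] * x_hat + y_b[:, :, None, None]
```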

+

Style Mixing

+

To prevent the generator from assuming adjacent styles are correlated, they randomly use different styles for different blocks. That is, they sample two latent vectors $(z_1, z_2)$ and corresponding $(w_1, w_2)$ and use $w_1$ based styles for some blocks and $w_2$ based styles for the other blocks, chosen randomly.

+

Stochastic Variation

+

Noise is made available to each block which helps the generator create more realistic images. +Noise is scaled per channel by a learned weight.

+

Bilinear Up and Down Sampling

+

All the up and down-sampling operations are accompanied by bilinear smoothing.

+

style_gan.svg

+

$A$ denotes a linear layer. +$B$ denotes a broadcast and scaling operation (noise is a single channel). +Style GAN also uses progressive growing like Progressive GAN

+

Style GAN 2

+

Style GAN 2 changes both the generator and the discriminator of Style GAN.

+

Weight Modulation and Demodulation

+

They remove the $\text{AdaIN}$ operator and replace it with the weight modulation and demodulation step. This is supposed to fix what they call droplet artifacts that are present in generated images, which are caused by the normalization in the $\text{AdaIN}$ operator. The style vector per layer is calculated from $w_i \in \mathcal{W}$ as $s_i = f_{A_i}(w_i)$.

+

Then the convolution weights $w$ are modulated as follows. ($w$ from here on refers to the weights, not the intermediate latent space; we stick to the same notation as the paper.)

+

$$w'_{i, j, k} = s_i \cdot w_{i, j, k}$$ Then it's demodulated by normalizing, $$w''_{i, j, k} = \frac{w'_{i, j, k}}{\sqrt{\sum_{i, k} \big(w'_{i, j, k}\big)^2 + \epsilon}}$$ where $i$ is the input channel, $j$ is the output channel, and $k$ is the kernel index.

+

Path Length Regularization

+

Path length regularization encourages a fixed-size step in $\mathcal{W}$ to result in a non-zero, + fixed-magnitude change in the generated image.
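A rough sketch of how this penalty can be computed (our own illustration under simplifying assumptions; the actual PathLengthPenalty module used by the training code also keeps an exponential moving average of the path lengths):

```python
import math
import torch

def path_length_penalty_sketch(w: torch.Tensor, images: torch.Tensor, a: float) -> torch.Tensor:
    """w is [batch_size, d_latent] (must be part of the graph that produced `images`),
    `images` is [batch_size, 3, height, width], and `a` is a running mean of path lengths."""
    # Random image-space direction, scaled so the expectation is resolution independent
    y = torch.randn_like(images) / math.sqrt(images.shape[2] * images.shape[3])
    # Jacobian-vector product J_w^T y via autograd
    grad, = torch.autograd.grad(outputs=(images * y).sum(), inputs=w, create_graph=True)
    # Penalize deviation of the path length from the running mean
    return ((grad.norm(2, dim=-1) - a) ** 2).mean()
```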

+

No Progressive Growing

+

StyleGAN2 uses residual connections (with down-sampling) in the discriminator and skip connections in the generator with up-sampling (the RGB outputs from each layer are added - no residual connections in feature maps). They show with experiments that the contribution of low-resolution layers is higher at the beginning of training and then the high-resolution layers take over.

+
+
+
148import math
+149from typing import Tuple, Optional, List
+150
+151import numpy as np
+152import torch
+153import torch.nn.functional as F
+154import torch.utils.data
+155from torch import nn
+
+
+
+
+ +

+

Mapping Network

+

Mapping Network

+

This is an MLP with 8 linear layers. The mapping network maps the latent vector $z \in \mathcal{Z}$ to an intermediate latent space $w \in \mathcal{W}$. $\mathcal{W}$ space will be disentangled from the image space, where the factors of variation become more linear.

+
+
+
158class MappingNetwork(nn.Module):
+
+
+
+
+ +
    +
  • features is the number of features in $z$ and $w$
  • +
  • n_layers is the number of layers in the mapping network.
  • +
+
+
+
172    def __init__(self, features: int, n_layers: int):
+
+
+
+
+ + +
+
+
177        super().__init__()
+
+
+
+
+ +

Create the MLP

+
+
+
180        layers = []
+181        for i in range(n_layers):
+
+
+
+ +
+
183            layers.append(EqualizedLinear(features, features))
+
+
+
+
+ +

Leaky Relu

+
+
+
185            layers.append(nn.LeakyReLU(negative_slope=0.2, inplace=True))
+186
+187        self.net = nn.Sequential(*layers)
+
+
+
+
+ + +
+
+
189    def forward(self, z: torch.Tensor):
+
+
+
+
+ +

Normalize $z$

+
+
+
191        z = F.normalize(z, dim=1)
+
+
+
+
+ +

Map $z$ to $w$

+
+
+
193        return self.net(z)
+
+
+
+
+ +

+

StyleGAN2 Generator

+

Generator

+

$A$ denotes a linear layer. +$B$ denotes a broadcast and scaling operation (noise is a single channel). +toRGB also has a style modulation which is not shown in the diagram to keep it simple.

+

The generator starts with a learned constant. Then it has a series of blocks. The feature map resolution is doubled at each block. Each block outputs an RGB image, and these are scaled up and summed to get the final RGB image.

+
+
+
196class Generator(nn.Module):
+
+
+
+
+ +
    +
  • log_resolution is the $\log_2$ of image resolution
  • +
  • d_latent is the dimensionality of $w$
  • +
  • n_features number of features in the convolution layer at the highest resolution (final block)
  • +
  • max_features maximum number of features in any generator block
  • +
+
+
+
212    def __init__(self, log_resolution: int, d_latent: int, n_features: int = 32, max_features: int = 512):
+
+
+
+
+ + +
+
+
219        super().__init__()
+
+
+
+
+ +

Calculate the number of features for each block

+

Something like [512, 512, 256, 128, 64, 32]

+
+
+
224        features = [min(max_features, n_features * (2 ** i)) for i in range(log_resolution - 2, -1, -1)]
+
+
+
+
+ +

Number of generator blocks

+
+
+
226        self.n_blocks = len(features)
+
+
+
+
+ +

Trainable $4 \times 4$ constant

+
+
+
229        self.initial_constant = nn.Parameter(torch.randn((1, features[0], 4, 4)))
+
+
+
+
+ +

First style block for $4 \times 4$ resolution and layer to get RGB

+
+
+
232        self.style_block = StyleBlock(d_latent, features[0], features[0])
+233        self.to_rgb = ToRGB(d_latent, features[0])
+
+
+
+
+ +

Generator blocks

+
+
+
236        blocks = [GeneratorBlock(d_latent, features[i - 1], features[i]) for i in range(1, self.n_blocks)]
+237        self.blocks = nn.ModuleList(blocks)
+
+
+
+
+ +

$2 \times$ up-sampling layer. The feature map is up-sampled at each block.

+
+
+
241        self.up_sample = UpSample()
+
+
+
+
+ +
    +
• w is $w$. In order to mix styles (use different $w$ for different layers), we provide a separate $w$ for each generator block. It has shape [n_blocks, batch_size, d_latent].
  • +
• input_noise is the noise for each block. It's a list of pairs of noise tensors because each block (except the initial) has two noise inputs, one after each convolution layer (see the diagram).
  • +
+
+
+
243    def forward(self, w: torch.Tensor, input_noise: List[Tuple[Optional[torch.Tensor], Optional[torch.Tensor]]]):
+
+
+
+
+ +

Get batch size

+
+
+
253        batch_size = w.shape[1]
+
+
+
+
+ +

Expand the learned constant to match batch size

+
+
+
256        x = self.initial_constant.expand(batch_size, -1, -1, -1)
+
+
+
+
+ +

The first style block

+
+
+
259        x = self.style_block(x, w[0], input_noise[0][1])
+
+
+
+
+ +

Get first rgb image

+
+
+
261        rgb = self.to_rgb(x, w[0])
+
+
+
+
+ +

Evaluate rest of the blocks

+
+
+
264        for i in range(1, self.n_blocks):
+
+
+
+
+ +

Up sample the feature map

+
+
+
266            x = self.up_sample(x)
+
+
+
+
+ +

Run it through the generator block

+
+
+
268            x, rgb_new = self.blocks[i - 1](x, w[i], input_noise[i])
+
+
+
+
+ +

Up sample the RGB image and add to the rgb from the block

+
+
+
270            rgb = self.up_sample(rgb) + rgb_new
+
+
+
+
+ +

Return the final RGB image

+
+
+
273        return rgb
+
+
+
+
+ +

+

Generator Block

+

Generator block

+

$A$ denotes a linear layer. +$B$ denotes a broadcast and scaling operation (noise is a single channel). +toRGB also has a style modulation which is not shown in the diagram to keep it simple.

+

The generator block consists of two style blocks ($3 \times 3$ convolutions with style modulation) +and an RGB output.

+
+
+
276class GeneratorBlock(nn.Module):
+
+
+
+
+ +
    +
  • d_latent is the dimensionality of $w$
  • +
  • in_features is the number of features in the input feature map
  • +
  • out_features is the number of features in the output feature map
  • +
+
+
+
291    def __init__(self, d_latent: int, in_features: int, out_features: int):
+
+
+
+
+ + +
+
+
297        super().__init__()
+
+
+
+
+ +

First style block changes the feature map size to out_features

+
+
+
300        self.style_block1 = StyleBlock(d_latent, in_features, out_features)
+
+
+
+
+ +

Second style block

+
+
+
302        self.style_block2 = StyleBlock(d_latent, out_features, out_features)
+
+
+
+
+ +

toRGB layer

+
+
+
305        self.to_rgb = ToRGB(d_latent, out_features)
+
+
+
+
+ +
    +
  • x is the input feature map of shape [batch_size, in_features, height, width]
  • +
  • w is $w$ with shape [batch_size, d_latent]
  • +
  • noise is a tuple of two noise tensors of shape [batch_size, 1, height, width]
  • +
+
+
+
307    def forward(self, x: torch.Tensor, w: torch.Tensor, noise: Tuple[Optional[torch.Tensor], Optional[torch.Tensor]]):
+
+
+
+
+ +

First style block with first noise tensor. +The output is of shape [batch_size, out_features, height, width]

+
+
+
315        x = self.style_block1(x, w, noise[0])
+
+
+
+
+ +

Second style block with second noise tensor. +The output is of shape [batch_size, out_features, height, width]

+
+
+
318        x = self.style_block2(x, w, noise[1])
+
+
+
+
+ +

Get RGB image

+
+
+
321        rgb = self.to_rgb(x, w)
+
+
+
+
+ +

Return feature map and rgb image

+
+
+
324        return x, rgb
+
+
+
+
+ +

+

Style Block

+

Style block

+

$A$ denotes a linear layer. +$B$ denotes a broadcast and scaling operation (noise is single channel).

+

Style block has a weight modulation convolution layer.

+
+
+
327class StyleBlock(nn.Module):
+
+
+
+
+ +
    +
  • d_latent is the dimensionality of $w$
  • +
  • in_features is the number of features in the input feature map
  • +
  • out_features is the number of features in the output feature map
  • +
+
+
+
340    def __init__(self, d_latent: int, in_features: int, out_features: int):
+
+
+
+
+ + +
+
+
346        super().__init__()
+
+
+
+
+ +

Get style vector from $w$ (denoted by $A$ in the diagram) with +an equalized learning-rate linear layer

+
+
+
349        self.to_style = EqualizedLinear(d_latent, in_features, bias=1.0)
+
+
+
+
+ +

Weight modulated convolution layer

+
+
+
351        self.conv = Conv2dWeightModulate(in_features, out_features, kernel_size=3)
+
+
+
+
+ +

Noise scale

+
+
+
353        self.scale_noise = nn.Parameter(torch.zeros(1))
+
+
+
+
+ +

Bias

+
+
+
355        self.bias = nn.Parameter(torch.zeros(out_features))
+
+
+
+
+ +

Activation function

+
+
+
358        self.activation = nn.LeakyReLU(0.2, True)
+
+
+
+
+ +
    +
  • x is the input feature map of shape [batch_size, in_features, height, width]
  • +
  • w is $w$ with shape [batch_size, d_latent]
  • +
  • noise is a tensor of shape [batch_size, 1, height, width]
  • +
+
+
+
360    def forward(self, x: torch.Tensor, w: torch.Tensor, noise: Optional[torch.Tensor]):
+
+
+
+
+ +

Get style vector $s$

+
+
+
367        s = self.to_style(w)
+
+
+
+
+ +

Weight modulated convolution

+
+
+
369        x = self.conv(x, s)
+
+
+
+
+ +

Scale and add noise

+
+
+
371        if noise is not None:
+372            x = x + self.scale_noise[None, :, None, None] * noise
+
+
+
+
+ +

Add bias and evaluate activation function

+
+
+
374        return self.activation(x + self.bias[None, :, None, None])
+
+
+
+
+ +

+

To RGB

+

To RGB

+

$A$ denotes a linear layer.

+

Generates an RGB image from a feature map using $1 \times 1$ convolution.

+
+
+
377class ToRGB(nn.Module):
+
+
+
+
+ +
    +
  • d_latent is the dimensionality of $w$
  • +
  • features is the number of features in the feature map
  • +
+
+
+
389    def __init__(self, d_latent: int, features: int):
+
+
+
+
+ + +
+
+
394        super().__init__()
+
+
+
+
+ +

Get style vector from $w$ (denoted by $A$ in the diagram) with +an equalized learning-rate linear layer

+
+
+
397        self.to_style = EqualizedLinear(d_latent, features, bias=1.0)
+
+
+
+
+ +

Weight modulated convolution layer without demodulation

+
+
+
400        self.conv = Conv2dWeightModulate(features, 3, kernel_size=1, demodulate=False)
+
+
+
+
+ +

Bias

+
+
+
402        self.bias = nn.Parameter(torch.zeros(1))
+
+
+
+
+ +

Activation function

+
+
+
404        self.activation = nn.LeakyReLU(0.2, True)
+
+
+
+
+ +
    +
  • x is the input feature map of shape [batch_size, in_features, height, width]
  • +
  • w is $w$ with shape [batch_size, d_latent]
  • +
+
+
+
406    def forward(self, x: torch.Tensor, w: torch.Tensor):
+
+
+
+
+ +

Get style vector $s$

+
+
+
412        style = self.to_style(w)
+
+
+
+
+ +

Weight modulated convolution

+
+
+
414        x = self.conv(x, style)
+
+
+
+
+ +

Add bias and evaluate activation function

+
+
+
416        return self.activation(x + self.bias[None, :, None, None])
+
+
+
+
+ +

Convolution with Weight Modulation and Demodulation

+

This layer scales the convolution weights by the style vector and demodulates by normalizing it.

+
+
+
419class Conv2dWeightModulate(nn.Module):
+
+
+
+
+ +
    +
  • in_features is the number of features in the input feature map
  • +
  • out_features is the number of features in the output feature map
  • +
  • kernel_size is the size of the convolution kernel
  • +
• demodulate is a flag indicating whether to normalize the weights by their standard deviation
  • +
  • eps is the $\epsilon$ for normalizing
  • +
+
+
+
426    def __init__(self, in_features: int, out_features: int, kernel_size: int,
+427                 demodulate: bool = True, eps: float = 1e-8):
+
+
+
+
+ + +
+
+
435        super().__init__()
+
+
+
+
+ +

Number of output features

+
+
+
437        self.out_features = out_features
+
+
+
+
+ +

Whether to normalize weights

+
+
+
439        self.demodulate = demodulate
+
+
+
+
+ +

Padding size

+
+
+
441        self.padding = (kernel_size - 1) // 2
+
+
+
+ +
+
444        self.weight = EqualizedWeight([out_features, in_features, kernel_size, kernel_size])
+
+
+
+
+ +

$\epsilon$

+
+
+
446        self.eps = eps
+
+
+
+
+ +
    +
  • x is the input feature map of shape [batch_size, in_features, height, width]
  • +
  • s is style based scaling tensor of shape [batch_size, in_features]
  • +
+
+
+
448    def forward(self, x: torch.Tensor, s: torch.Tensor):
+
+
+
+
+ +

Get batch size, height and width

+
+
+
455        b, _, h, w = x.shape
+
+
+
+
+ +

Reshape the scales

+
+
+
458        s = s[:, None, :, None, None]
+
+
+
+ +
+
460        weights = self.weight()[None, :, :, :, :]
+
+
+
+
+ +

$$w'_{i, j, k} = s_i \cdot w_{i, j, k}$$ where $i$ is the input channel, $j$ is the output channel, and $k$ is the kernel index.

+

The result has shape [batch_size, out_features, in_features, kernel_size, kernel_size]

+
+
+
465        weights = weights * s
+
+
+
+
+ +

Demodulate

+
+
+
468        if self.demodulate:
+
+
+
+
+ +

+ +

+
+
+
470            sigma_inv = torch.rsqrt((weights ** 2).sum(dim=(2, 3, 4), keepdim=True) + self.eps)
+
+
+
+
+ +

+ +

+
+
+
472            weights = weights * sigma_inv
+
+
+
+
+ +

Reshape x

+
+
+
475        x = x.reshape(1, -1, h, w)
+
+
+
+
+ +

Reshape weights

+
+
+
478        _, _, *ws = weights.shape
+479        weights = weights.reshape(b * self.out_features, *ws)
+
+
+
+
+ +

Use grouped convolution to efficiently calculate the convolution with sample wise kernel. +i.e. we have a different kernel (weights) for each sample in the batch

+
+
+
483        x = F.conv2d(x, weights, padding=self.padding, groups=b)
+
+
+
+
+ +

Reshape x to [batch_size, out_features, height, width] and return

+
+
+
486        return x.reshape(-1, self.out_features, h, w)
+
+
+
+
+ +

+

Style GAN2 Discriminator

+

Discriminator

+

Discriminator first transforms the image to a feature map of the same resolution and then +runs it through a series of blocks with residual connections. +The resolution is down-sampled by $2 \times$ at each block while doubling the +number of features.

+
+
+
489class Discriminator(nn.Module):
+
+
+
+
+ +
    +
  • log_resolution is the $\log_2$ of image resolution
  • +
  • n_features number of features in the convolution layer at the highest resolution (first block)
  • +
  • max_features maximum number of features in any generator block
  • +
+
+
+
502    def __init__(self, log_resolution: int, n_features: int = 64, max_features: int = 512):
+
+
+
+
+ + +
+
+
508        super().__init__()
+
+
+
+
+ +

Layer to convert RGB image to a feature map with n_features number of features.

+
+
+
511        self.from_rgb = nn.Sequential(
+512            EqualizedConv2d(3, n_features, 1),
+513            nn.LeakyReLU(0.2, True),
+514        )
+
+
+
+
+ +

Calculate the number of features for each block.

+

Something like [64, 128, 256, 512, 512, 512].

+
+
+
519        features = [min(max_features, n_features * (2 ** i)) for i in range(log_resolution - 1)]
+
+
+
+
+ +

Number of discriminator blocks

+
+
+
521        n_blocks = len(features) - 1
+
+
+
+
+ +

Discriminator blocks

+
+
+
523        blocks = [DiscriminatorBlock(features[i], features[i + 1]) for i in range(n_blocks)]
+524        self.blocks = nn.Sequential(*blocks)
+
+
+
+ +
+
527        self.std_dev = MiniBatchStdDev()
+
+
+
+
+ +

Number of features after adding the standard deviations map

+
+
+
529        final_features = features[-1] + 1
+
+
+
+
+ +

Final $3 \times 3$ convolution layer

+
+
+
531        self.conv = EqualizedConv2d(final_features, final_features, 3)
+
+
+
+
+ +

Final linear layer to get the classification

+
+
+
533        self.final = EqualizedLinear(2 * 2 * final_features, 1)
+
+
+
+
+ +
    +
  • x is the input image of shape [batch_size, 3, height, width]
  • +
+
+
+
535    def forward(self, x: torch.Tensor):
+
+
+
+
+ +

Try to normalize the image (this is totally optional, but sped up the early training a little)

+
+
+
541        x = x - 0.5
+
+
+
+
+ +

Convert from RGB

+
+
+
543        x = self.from_rgb(x)
+
+
+
+
+ +

Run through the discriminator blocks

+
+
+
545        x = self.blocks(x)
+
+
+
+
+ +

Calculate and append mini-batch standard deviation

+
+
+
548        x = self.std_dev(x)
+
+
+
+
+ +

$3 \times 3$ convolution

+
+
+
550        x = self.conv(x)
+
+
+
+
+ +

Flatten

+
+
+
552        x = x.reshape(x.shape[0], -1)
+
+
+
+
+ +

Return the classification score

+
+
+
554        return self.final(x)
+
+
+
+
+ +

+

Discriminator Block

+

Discriminator block

+

Discriminator block consists of two $3 \times 3$ convolutions with a residual connection.

+
+
+
557class DiscriminatorBlock(nn.Module):
+
+
+
+
+ +
    +
  • in_features is the number of features in the input feature map
  • +
  • out_features is the number of features in the output feature map
  • +
+
+
+
567    def __init__(self, in_features, out_features):
+
+
+
+
+ + +
+
+
572        super().__init__()
+
+
+
+
+ +

Down-sampling and $1 \times 1$ convolution layer for the residual connection

+
+
+
574        self.residual = nn.Sequential(DownSample(),
+575                                      EqualizedConv2d(in_features, out_features, kernel_size=1))
+
+
+
+
+ +

Two $3 \times 3$ convolutions

+
+
+
578        self.block = nn.Sequential(
+579            EqualizedConv2d(in_features, in_features, kernel_size=3, padding=1),
+580            nn.LeakyReLU(0.2, True),
+581            EqualizedConv2d(in_features, out_features, kernel_size=3, padding=1),
+582            nn.LeakyReLU(0.2, True),
+583        )
+
+
+
+
+ +

Down-sampling layer

+
+
+
586        self.down_sample = DownSample()
+
+
+
+
+ +

Scaling factor $\frac{1}{\sqrt 2}$ after adding the residual

+
+
+
589        self.scale = 1 / math.sqrt(2)
+
+
+
+
+ + +
+
+
591    def forward(self, x):
+
+
+
+
+ +

Get the residual connection

+
+
+
593        residual = self.residual(x)
+
+
+
+
+ +

Convolutions

+
+
+
596        x = self.block(x)
+
+
+
+
+ +

Down-sample

+
+
+
598        x = self.down_sample(x)
+
+
+
+
+ +

Add the residual and scale

+
+
+
601        return (x + residual) * self.scale
+
+
+
+
+ +

+

Mini-batch Standard Deviation

+

Mini-batch standard deviation calculates the standard deviation across a mini-batch (or subgroups within the mini-batch) for each feature in the feature map. Then it takes the mean of all the standard deviations and appends it to the feature map as one extra feature.

+
+
+
604class MiniBatchStdDev(nn.Module):
+
+
+
+
+ +
    +
  • group_size is the number of samples to calculate standard deviation across.
  • +
+
+
+
616    def __init__(self, group_size: int = 4):
+
+
+
+
+ + +
+
+
620        super().__init__()
+621        self.group_size = group_size
+
+
+
+
+ +
    +
  • x is the feature map
  • +
+
+
+
623    def forward(self, x: torch.Tensor):
+
+
+
+
+ +

Check if the batch size is divisible by the group size

+
+
+
628        assert x.shape[0] % self.group_size == 0
+
+
+
+
+ +

Split the samples into groups of group_size, we flatten the feature map to a single dimension +since we want to calculate the standard deviation for each feature.

+
+
+
631        grouped = x.view(self.group_size, -1)
+
+
+
+
+ +

Calculate the standard deviation for each feature among group_size samples $$\sigma = \sqrt{\frac{1}{N} \sum_{i=1}^{N} \big(x_i - \bar{x}\big)^2 + \epsilon}$$

+
+
+
635        std = torch.sqrt(grouped.var(dim=0) + 1e-8)
+
+
+
+
+ +

Get the mean standard deviation

+
+
+
637        std = std.mean().view(1, 1, 1, 1)
+
+
+
+
+ +

Expand the standard deviation to append to the feature map

+
+
+
639        b, _, h, w = x.shape
+640        std = std.expand(b, -1, h, w)
+
+
+
+
+ +

Append (concatenate) the standard deviations to the feature map

+
+
+
642        return torch.cat([x, std], dim=1)
+
+
+
+
+ +

+

Down-sample

+

The down-sample operation smoothens each feature channel and scales it down by $2 \times$ using bilinear interpolation. This is based on the paper Making Convolutional Networks Shift-Invariant Again.

+
+
+
645class DownSample(nn.Module):
+
+
+
+
+ + +
+
+
656    def __init__(self):
+657        super().__init__()
+
+
+
+
+ +

Smoothing layer

+
+
+
659        self.smooth = Smooth()
+
+
+
+
+ + +
+
+
661    def forward(self, x: torch.Tensor):
+
+
+
+
+ +

Smoothing or blurring

+
+
+
663        x = self.smooth(x)
+
+
+
+
+ +

Scaled down

+
+
+
665        return F.interpolate(x, (x.shape[2] // 2, x.shape[3] // 2), mode='bilinear', align_corners=False)
+
+
+
+
+ +

+

Up-sample

+

The up-sample operation scales the image up by $2 \times$ and smoothens each feature channel. +This is based on the paper + Making Convolutional Networks Shift-Invariant Again.

+
+
+
668class UpSample(nn.Module):
+
+
+
+
+ + +
+
+
678    def __init__(self):
+679        super().__init__()
+
+
+
+
+ +

Up-sampling layer

+
+
+
681        self.up_sample = nn.Upsample(scale_factor=2, mode='bilinear', align_corners=False)
+
+
+
+
+ +

Smoothing layer

+
+
+
683        self.smooth = Smooth()
+
+
+
+
+ + +
+
+
685    def forward(self, x: torch.Tensor):
+
+
+
+
+ +

Up-sample and smoothen

+
+
+
687        return self.smooth(self.up_sample(x))
+
+
+
+
+ +

+

Smoothing Layer

+

This layer blurs each channel

+
+
+
690class Smooth(nn.Module):
+
+
+
+
+ + +
+
+
698    def __init__(self):
+699        super().__init__()
+
+
+
+
+ +

Blurring kernel

+
+
+
701        kernel = [[1, 2, 1],
+702                  [2, 4, 2],
+703                  [1, 2, 1]]
+
+
+
+
+ +

Convert the kernel to a PyTorch tensor

+
+
+
705        kernel = torch.tensor([[kernel]], dtype=torch.float)
+
+
+
+
+ +

Normalize the kernel

+
+
+
707        kernel /= kernel.sum()
+
+
+
+
+ +

Save kernel as a fixed parameter (no gradient updates)

+
+
+
709        self.kernel = nn.Parameter(kernel, requires_grad=False)
+
+
+
+
+ +

Padding layer

+
+
+
711        self.pad = nn.ReplicationPad2d(1)
+
+
+
+
+ + +
+
+
713    def forward(self, x: torch.Tensor):
+
+
+
+
+ +

Get shape of the input feature map

+
+
+
715        b, c, h, w = x.shape
+
+
+
+
+ +

Reshape for smoothening

+
+
+
717        x = x.view(-1, 1, h, w)
+
+
+
+
+ +

Add padding

+
+
+
720        x = self.pad(x)
+
+
+
+
+ +

Smoothen (blur) with the kernel

+
+
+
723        x = F.conv2d(x, self.kernel)
+
+
+
+
+ +

Reshape and return

+
+
+
726        return x.view(b, c, h, w)
+
+
+
+
+ +

+

Learning-rate Equalized Linear Layer

+

This uses learning-rate equalized weights for a linear layer.

+
+
+
729class EqualizedLinear(nn.Module):
+
+
+
+
+ +
    +
  • in_features is the number of features in the input feature map
  • +
  • out_features is the number of features in the output feature map
  • +
  • bias is the bias initialization constant
  • +
+
+
+
737    def __init__(self, in_features: int, out_features: int, bias: float = 0.):
+
+
+
+
+ + +
+
+
744        super().__init__()
+
+
+
+ +
+
746        self.weight = EqualizedWeight([out_features, in_features])
+
+
+
+
+ +

Bias

+
+
+
748        self.bias = nn.Parameter(torch.ones(out_features) * bias)
+
+
+
+
+ + +
+
+
750    def forward(self, x: torch.Tensor):
+
+
+
+
+ +

Linear transformation

+
+
+
752        return F.linear(x, self.weight(), bias=self.bias)
+
+
+
+
+ +

+

Learning-rate Equalized 2D Convolution Layer

+

This uses learning-rate equalized weights for a convolution layer.

+
+
+
755class EqualizedConv2d(nn.Module):
+
+
+
+
+ +
  • in_features is the number of features in the input feature map
  • out_features is the number of features in the output feature map
  • kernel_size is the size of the convolution kernel
  • padding is the padding to be added on both sides of each size dimension
+
+
+
763    def __init__(self, in_features: int, out_features: int,
+764                 kernel_size: int, padding: int = 0):
+
+
+
+
+ + +
+
+
771        super().__init__()
+
+
+
+
+ +

Padding size

+
+
+
773        self.padding = padding
+
+
+
+ +
+
775        self.weight = EqualizedWeight([out_features, in_features, kernel_size, kernel_size])
+
+
+
+
+ +

Bias

+
+
+
777        self.bias = nn.Parameter(torch.ones(out_features))
+
+
+
+
+ + +
+
+
779    def forward(self, x: torch.Tensor):
+
+
+
+
+ +

Convolution

+
+
+
781        return F.conv2d(x, self.weight(), bias=self.bias, padding=self.padding)
+
+
+
+
+ +

+

Learning-rate Equalized Weights Parameter

+

This is based on equalized learning rate introduced in the Progressive GAN paper. Instead of initializing weights at $\mathcal{N}(0,c)$ they initialize weights to $\mathcal{N}(0, 1)$ and then multiply them by $c$ when using it, $$w_i = c \hat{w}_i$$

+

The gradients on stored parameters $\hat{w}$ get multiplied by $c$ but this doesn't have an effect since optimizers such as Adam normalize them by a running mean of the squared gradients.

+

The optimizer updates on $\hat{w}$ are proportional to the learning rate $\lambda$. But the effective weights $w$ get updated in proportion to $c \lambda$. Without equalized learning rate, the effective weights would get updated in proportion to just $\lambda$.

+

So we are effectively scaling the learning rate by $c$ for these weight parameters.
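As a worked example (not from the paper): a linear layer with $512$ input features has $c = 1/\sqrt{512} \approx 0.044$, so its effective weights $w = c\hat{w}$ move in proportion to $0.044\,\lambda$ per step instead of $\lambda$.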

+
+
+
784class EqualizedWeight(nn.Module):
+
+
+
+
+ +
  • shape is the shape of the weight parameter
+
+
+
804    def __init__(self, shape: List[int]):
+
+
+
+
+ + +
+
+
808        super().__init__()
+
+
+
+
+ +

He initialization constant

+
+
+
811        self.c = 1 / math.sqrt(np.prod(shape[1:]))
+
+
+
+
+ +

Initialize the weights with $\mathcal{N}(0, 1)$

+
+
+
813        self.weight = nn.Parameter(torch.randn(shape))
+
+
+
+
+ +

Weight multiplication coefficient

+
+
+
+
+
+
+
+ + +
+
+
816    def forward(self):
+
+
+
+
+ +

Multiply the weights by $c$ and return

+
+
+
818        return self.weight * self.c
+
+
+
+
+ +

+

Gradient Penalty

+

This is the $R_1$ regularization penalty from the paper Which Training Methods for GANs do actually Converge?.

+

$$R_1(\psi) = \frac{\gamma}{2} \mathbb{E}_{p_\mathcal{D}(x)} \Big[\Vert \nabla_x D_\psi(x) \Vert^2\Big]$$

+

That is, we try to reduce the L2 norm of gradients of the discriminator with respect to images, for real images ($P_\mathcal{D}$).

+
+
+
821class GradientPenalty(nn.Module):
+
+
+
+
+ +
  • x is $x \sim \mathcal{D}$
  • d is $D(x)$
+
+
+
836    def forward(self, x: torch.Tensor, d: torch.Tensor):
+
+
+
+
+ +

Get batch size

+
+
+
843        batch_size = x.shape[0]
+
+
+
+
+ +

Calculate gradients of $D(x)$ with respect to $x$. grad_outputs is set to $1$ since we want the gradients of $D(x)$, and we need to create (and retain) the graph since we have to compute gradients with respect to the weights on this loss.

+
+
+
849        gradients, *_ = torch.autograd.grad(outputs=d,
+850                                            inputs=x,
+851                                            grad_outputs=d.new_ones(d.shape),
+852                                            create_graph=True)
+
+
+
+
+ +

Reshape gradients to calculate the norm

+
+
+
855        gradients = gradients.reshape(batch_size, -1)
+
+
+
+
+ +

Calculate the norm $\Vert \nabla_{x} D(x) \Vert_2$

+
+
+
857        norm = gradients.norm(2, dim=-1)
+
+
+
+
+ +

Return the loss $\mathbb{E}\big[\Vert \nabla_x D_\psi(x) \Vert_2^2\big]$

+
+
+
859        return torch.mean(norm ** 2)
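A minimal usage sketch (discriminator, real_images, adversarial_loss and gamma are illustrative names, not defined in this file):

    real_images.requires_grad_()                      # gradients w.r.t. the input images are needed
    d = discriminator(real_images)                    # D(x) for the real batch
    r1 = GradientPenalty()(real_images, d)            # mean squared gradient norm
    disc_loss = adversarial_loss + 0.5 * gamma * r1   # the gamma/2 weighting is applied by the caller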
+
+
+
+
+ +

+

Path Length Penalty

+

This regularization encourages a fixed-size step in $w$ to result in a fixed-magnitude change in the image.

+

$$\mathbb{E}_{w \sim f(z), y \sim \mathcal{N}(0, \mathbf{I})} \Big[\big(\Vert \mathbf{J}^\top_{w} y \Vert_2 - a\big)^2\Big]$$

+

where $\mathbf{J}_w$ is the Jacobian $\mathbf{J}_w = \frac{\partial g}{\partial w}$, $w \in \mathcal{W}$ are samples from the mapping network, and $y$ are random images whose pixels are sampled from $\mathcal{N}(0, \mathbf{I})$.

+

$a$ is the exponential moving average of $\Vert \mathbf{J}^\top_{w} y \Vert_2$ as the training progresses.

+

$\mathbf{J}^\top_{w} y$ is calculated without explicitly computing the Jacobian, using $$\mathbf{J}^\top_{w} y = \nabla_w \big(g(w) \cdot y \big)$$

+
+
+
862class PathLengthPenalty(nn.Module):
+
+
+
+
+ +
  • beta is the constant $\beta$ used to calculate the exponential moving average $a$
+
+
+
885    def __init__(self, beta: float):
+
+
+
+
+ + +
+
+
889        super().__init__()
+
+
+
+
+ +

$\beta$

+
+
+
892        self.beta = beta
+
+
+
+
+ +

Number of steps calculated $N$

+
+
+
894        self.steps = nn.Parameter(torch.tensor(0.), requires_grad=False)
+
+
+
+
+ +

Exponential sum of $\Vert \mathbf{J}^\top_{w} y \Vert_2$, $$\sum^N_{i=1} (1 - \beta) \beta^{N - i} \big[\Vert \mathbf{J}^\top_{w} y \Vert_2\big]_i$$ where $\big[\Vert \mathbf{J}^\top_{w} y \Vert_2\big]_i$ is its value at the $i$-th training step

+
+
+
898        self.exp_sum_a = nn.Parameter(torch.tensor(0.), requires_grad=False)
+
+
+
+
+ +
  • w is the batch of $w$ of shape [batch_size, d_latent]
  • x are the generated images of shape [batch_size, 3, height, width]
+
+
+
900    def forward(self, w: torch.Tensor, x: torch.Tensor):
+
+
+
+
+ +

Get the device

+
+
+
907        device = x.device
+
+
+
+
+ +

Get number of pixels

+
+
+
909        image_size = x.shape[2] * x.shape[3]
+
+
+
+
+ +

Sample $y \sim \mathcal{N}(0, \mathbf{I})$

+
+
+
911        y = torch.randn(x.shape, device=device)
+
+
+
+
+ +

Calculate $\big(g(w) \cdot y \big)$ and normalize by the square root of the image size. This scaling is not mentioned in the paper but was present in their implementation.

+
+
+
915        output = (x * y).sum() / math.sqrt(image_size)
+
+
+
+
+ +

Calculate gradients to get $\mathbf{J}^\top_{w} y$

+
+
+
918        gradients, *_ = torch.autograd.grad(outputs=output,
+919                                            inputs=w,
+920                                            grad_outputs=torch.ones(output.shape, device=device),
+921                                            create_graph=True)
+
+
+
+
+ +

Calculate L2-norm of $\mathbf{J}^\top_{w} y$

+
+
+
924        norm = (gradients ** 2).sum(dim=2).mean(dim=1).sqrt()
+
+
+
+
+ +

Regularize after first step

+
+
+
927        if self.steps > 0:
+
+
+
+
+ +

Calculate $a$ as the bias-corrected moving average $$a = \frac{1}{1 - \beta^N} \sum^N_{i=1} (1 - \beta) \beta^{N - i} \big[\Vert \mathbf{J}^\top_{w} y \Vert_2\big]_i$$

+
+
+
930            a = self.exp_sum_a / (1 - self.beta ** self.steps)
+
+
+
+
+ +

Calculate the penalty $$\mathbb{E}\Big[\big(\Vert \mathbf{J}^\top_{w} y \Vert_2 - a\big)^2\Big]$$

+
+
+
934            loss = torch.mean((norm - a) ** 2)
+935        else:
+
+
+
+
+ +

Return a dummy loss if we can’t calculate $a$

+
+
+
937            loss = norm.new_tensor(0)
+
+
+
+
+ +

Calculate the mean of $\Vert \mathbf{J}^\top_{w} y \Vert_2$

+
+
+
940        mean = norm.mean().detach()
+
+
+
+
+ +

Update exponential sum

+
+
+
942        self.exp_sum_a.mul_(self.beta).add_(mean, alpha=1 - self.beta)
+
+
+
+
+ +

Increment $N$

+
+
+
944        self.steps.add_(1.)
+
+
+
+
+ +

Return the penalty

+
+
+
947        return loss
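A minimal usage sketch (plp_weight and the lazy-regularization interval are illustrative; generator, the mapping-network output w, and input_noise are as defined in this file):

    plp = PathLengthPenalty(beta=0.99)
    # in the generator update, typically applied only every few steps (lazy regularization)
    images = generator(w, input_noise)                 # w comes from the mapping network and requires grad
    gen_loss = gen_loss + plp_weight * plp(w, images)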
+
+
+
+ + + + + + + \ No newline at end of file diff --git a/docs/gan/stylegan/mapping_network.svg b/docs/gan/stylegan/mapping_network.svg new file mode 100644 index 00000000..69219405 --- /dev/null +++ b/docs/gan/stylegan/mapping_network.svg @@ -0,0 +1,85 @@ +
[mapping_network.svg — diagram labels: z, Norm, Linear (repeated), More layers, w]
\ No newline at end of file diff --git a/docs/gan/stylegan/progressive_gan.svg b/docs/gan/stylegan/progressive_gan.svg new file mode 100644 index 00000000..cc150e61 --- /dev/null +++ b/docs/gan/stylegan/progressive_gan.svg @@ -0,0 +1,87 @@ +
[progressive_gan.svg — diagram labels: Generator, Discriminator, Progressive Growing; blocks 4x4, 8x8, ...; 2x and 0.5x scaling; toRGB, fromRGB; 1-⍺ blending]
\ No newline at end of file diff --git a/docs/gan/stylegan/style_block.svg b/docs/gan/stylegan/style_block.svg new file mode 100644 index 00000000..01e57797 --- /dev/null +++ b/docs/gan/stylegan/style_block.svg @@ -0,0 +1,85 @@ +
[style_block.svg — diagram labels: feature map, A, Mod, Demod, weights, 3x3 Conv, bias, B]
\ No newline at end of file diff --git a/docs/gan/stylegan/style_gan.svg b/docs/gan/stylegan/style_gan.svg new file mode 100644 index 00000000..dfe963b4 --- /dev/null +++ b/docs/gan/stylegan/style_gan.svg @@ -0,0 +1,85 @@ +
[style_gan.svg — diagram labels: Mapping Network (z, Norm, Linear, More layers, w), 512x4x4 Const, 3x3 Conv, A, AdaIN, B, noise, Upsample, 4x4, 8x8, more layers, toRGB]
\ No newline at end of file diff --git a/docs/gan/stylegan/style_gan2.svg b/docs/gan/stylegan/style_gan2.svg new file mode 100644 index 00000000..6eef9967 --- /dev/null +++ b/docs/gan/stylegan/style_gan2.svg @@ -0,0 +1,85 @@ +
[style_gan2.svg — diagram labels: 512x4x4 Const, 3x3 Conv, A, Mod, Demod, weights, bias, B, Upsample, 4x4, 8x8, more layers, toRGB]
\ No newline at end of file diff --git a/docs/gan/stylegan/style_gan2_disc.svg b/docs/gan/stylegan/style_gan2_disc.svg new file mode 100644 index 00000000..8ff194d8 --- /dev/null +++ b/docs/gan/stylegan/style_gan2_disc.svg @@ -0,0 +1,85 @@ +
[style_gan2_disc.svg — diagram labels: fromRGB, 1024x1024, 3x3 Conv, 1x1 Conv, Downsample, 8x8, More layers, Minibatch StdDev, 4x4, 2x2, Flatten, Classify]
\ No newline at end of file diff --git a/docs/gan/stylegan/to_rgb.svg b/docs/gan/stylegan/to_rgb.svg new file mode 100644 index 00000000..32d7ae2d --- /dev/null +++ b/docs/gan/stylegan/to_rgb.svg @@ -0,0 +1,85 @@ +
[to_rgb.svg — diagram labels: feature map, A, Mod, weights, 3x3 Conv, bias]
\ No newline at end of file diff --git a/docs/gan/wasserstein/experiment.html b/docs/gan/wasserstein/experiment.html index c0f76c87..763c6a65 100644 --- a/docs/gan/wasserstein/experiment.html +++ b/docs/gan/wasserstein/experiment.html @@ -199,19 +199,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/gan/wasserstein/gradient_penalty/experiment.html b/docs/gan/wasserstein/gradient_penalty/experiment.html index 40676390..84917eb7 100644 --- a/docs/gan/wasserstein/gradient_penalty/experiment.html +++ b/docs/gan/wasserstein/gradient_penalty/experiment.html @@ -332,19 +332,46 @@ includes gradient penalty.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/gan/wasserstein/gradient_penalty/index.html b/docs/gan/wasserstein/gradient_penalty/index.html index 0c67e878..6270f7c9 100644 --- a/docs/gan/wasserstein/gradient_penalty/index.html +++ b/docs/gan/wasserstein/gradient_penalty/index.html @@ -221,19 +221,46 @@ with respect to weight on this loss.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/gan/wasserstein/gradient_penalty/readme.html b/docs/gan/wasserstein/gradient_penalty/readme.html index 11202230..f2b36fba 100644 --- a/docs/gan/wasserstein/gradient_penalty/readme.html +++ b/docs/gan/wasserstein/gradient_penalty/readme.html @@ -110,19 +110,46 @@ proposal a better way to improve Lipschitz constraint, a gradient penalty.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/gan/wasserstein/index.html b/docs/gan/wasserstein/index.html index 6107fd28..9261fcf3 100644 --- a/docs/gan/wasserstein/index.html +++ b/docs/gan/wasserstein/index.html @@ -251,19 +251,46 @@ so we minimize, displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/gan/wasserstein/readme.html b/docs/gan/wasserstein/readme.html index 5ce53e36..6560d224 100644 --- a/docs/gan/wasserstein/readme.html +++ b/docs/gan/wasserstein/readme.html @@ -98,19 +98,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/hypernetworks/experiment.html b/docs/hypernetworks/experiment.html index 20e0bd2f..9048fd4e 100644 --- a/docs/hypernetworks/experiment.html +++ b/docs/hypernetworks/experiment.html @@ -343,19 +343,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/hypernetworks/hyper_lstm.html b/docs/hypernetworks/hyper_lstm.html index 2196d261..591be297 100644 --- a/docs/hypernetworks/hyper_lstm.html +++ b/docs/hypernetworks/hyper_lstm.html @@ -741,19 +741,46 @@ Rest of the layers get the input from the layer below

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/hypernetworks/index.html b/docs/hypernetworks/index.html index c6d59acb..a3099fd4 100644 --- a/docs/hypernetworks/index.html +++ b/docs/hypernetworks/index.html @@ -95,19 +95,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/index.html b/docs/index.html index 498059d7..7938bf98 100644 --- a/docs/index.html +++ b/docs/index.html @@ -172,19 +172,46 @@ implementations.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/lstm/index.html b/docs/lstm/index.html index 16708835..be066378 100644 --- a/docs/lstm/index.html +++ b/docs/lstm/index.html @@ -471,19 +471,46 @@ Rest of the layers get the input from the layer below

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/normalization/batch_channel_norm/index.html b/docs/normalization/batch_channel_norm/index.html index 7332e8dc..ff1649f1 100644 --- a/docs/normalization/batch_channel_norm/index.html +++ b/docs/normalization/batch_channel_norm/index.html @@ -645,19 +645,46 @@ $Var[x_{(i_N, i_G)}] = \mathbb{E}[x^2_{(i_N, i_G)}] - \mathbb{E}[x_{(i_N, i_G)}] displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/normalization/batch_norm/cifar10.html b/docs/normalization/batch_norm/cifar10.html index 2ab0fbb8..0f4be662 100644 --- a/docs/normalization/batch_norm/cifar10.html +++ b/docs/normalization/batch_norm/cifar10.html @@ -246,19 +246,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/normalization/batch_norm/index.html b/docs/normalization/batch_norm/index.html index 5a7cdd58..6113f695 100644 --- a/docs/normalization/batch_norm/index.html +++ b/docs/normalization/batch_norm/index.html @@ -472,19 +472,46 @@ i.e. the means for each feature $\mathbb{E}[(x^{(k)})^2]$

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/normalization/batch_norm/mnist.html b/docs/normalization/batch_norm/mnist.html index edd68833..9a5f5889 100644 --- a/docs/normalization/batch_norm/mnist.html +++ b/docs/normalization/batch_norm/mnist.html @@ -318,19 +318,46 @@ and set a new function to calculate the model.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/normalization/batch_norm/readme.html b/docs/normalization/batch_norm/readme.html index 8d490274..b119a47f 100644 --- a/docs/normalization/batch_norm/readme.html +++ b/docs/normalization/batch_norm/readme.html @@ -162,19 +162,46 @@ a CNN classifier that uses batch normalization for MNIST dataset.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/normalization/group_norm/experiment.html b/docs/normalization/group_norm/experiment.html index 6e69db00..fc6d942f 100644 --- a/docs/normalization/group_norm/experiment.html +++ b/docs/normalization/group_norm/experiment.html @@ -356,19 +356,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/normalization/group_norm/index.html b/docs/normalization/group_norm/index.html index 69b70cca..927c0eb3 100644 --- a/docs/normalization/group_norm/index.html +++ b/docs/normalization/group_norm/index.html @@ -395,19 +395,46 @@ $Var[x_{(i_N, i_G)}] = \mathbb{E}[x^2_{(i_N, i_G)}] - \mathbb{E}[x_{(i_N, i_G)}] displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/normalization/group_norm/readme.html b/docs/normalization/group_norm/readme.html index 743354c1..fbadaf09 100644 --- a/docs/normalization/group_norm/readme.html +++ b/docs/normalization/group_norm/readme.html @@ -112,19 +112,46 @@ all channels within each group.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/normalization/index.html b/docs/normalization/index.html index 6014ae8f..af176eaf 100644 --- a/docs/normalization/index.html +++ b/docs/normalization/index.html @@ -103,19 +103,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/normalization/instance_norm/experiment.html b/docs/normalization/instance_norm/experiment.html index 51af5ad8..37d5cf60 100644 --- a/docs/normalization/instance_norm/experiment.html +++ b/docs/normalization/instance_norm/experiment.html @@ -337,19 +337,46 @@ style transfer and this is only a demo.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/normalization/instance_norm/index.html b/docs/normalization/instance_norm/index.html index 44165a2f..34d5cbf2 100644 --- a/docs/normalization/instance_norm/index.html +++ b/docs/normalization/instance_norm/index.html @@ -350,19 +350,46 @@ i.e. the means for each feature $\mathbb{E}[(x_{t,i}^2]$

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/normalization/instance_norm/readme.html b/docs/normalization/instance_norm/readme.html index 47df63d5..fb7400c2 100644 --- a/docs/normalization/instance_norm/readme.html +++ b/docs/normalization/instance_norm/readme.html @@ -102,19 +102,46 @@ introduces instance normalization which does that.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/normalization/layer_norm/index.html b/docs/normalization/layer_norm/index.html index 9bb9c800..3a8888a1 100644 --- a/docs/normalization/layer_norm/index.html +++ b/docs/normalization/layer_norm/index.html @@ -352,19 +352,46 @@ i.e. the means for each element $\mathbb{E}[X^2]$

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/normalization/layer_norm/readme.html b/docs/normalization/layer_norm/readme.html index 7df71ed8..6dea7db6 100644 --- a/docs/normalization/layer_norm/readme.html +++ b/docs/normalization/layer_norm/readme.html @@ -116,19 +116,46 @@ Layer normalization does it for each batch across all elements.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/normalization/weight_standardization/conv2d.html b/docs/normalization/weight_standardization/conv2d.html index 3f7504ae..96d884f7 100644 --- a/docs/normalization/weight_standardization/conv2d.html +++ b/docs/normalization/weight_standardization/conv2d.html @@ -182,19 +182,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/normalization/weight_standardization/experiment.html b/docs/normalization/weight_standardization/experiment.html index be25927f..9b253b78 100644 --- a/docs/normalization/weight_standardization/experiment.html +++ b/docs/normalization/weight_standardization/experiment.html @@ -249,19 +249,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/normalization/weight_standardization/index.html b/docs/normalization/weight_standardization/index.html index 1fd20786..58774fe2 100644 --- a/docs/normalization/weight_standardization/index.html +++ b/docs/normalization/weight_standardization/index.html @@ -213,19 +213,46 @@ and $I$ is the number of input channels times the kernel size ($I = C_{in} \time displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/normalization/weight_standardization/readme.html b/docs/normalization/weight_standardization/readme.html index 09f5e947..a8aa3c59 100644 --- a/docs/normalization/weight_standardization/readme.html +++ b/docs/normalization/weight_standardization/readme.html @@ -100,19 +100,46 @@ We also have an displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/optimizers/ada_belief.html b/docs/optimizers/ada_belief.html index 2b635e1f..a38a871c 100644 --- a/docs/optimizers/ada_belief.html +++ b/docs/optimizers/ada_belief.html @@ -448,19 +448,46 @@ $\color{cyan}{s_t} + \color{red}{\epsilon}$ in place of $v_t$.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/optimizers/adam.html b/docs/optimizers/adam.html index d20cc3a0..0c7cc7d2 100644 --- a/docs/optimizers/adam.html +++ b/docs/optimizers/adam.html @@ -558,19 +558,46 @@ is what we should specify as the hyper-parameter.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/optimizers/adam_warmup.html b/docs/optimizers/adam_warmup.html index 53fabc0b..bfa65785 100644 --- a/docs/optimizers/adam_warmup.html +++ b/docs/optimizers/adam_warmup.html @@ -199,19 +199,46 @@ where $w$ is the number of warmup steps.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/optimizers/adam_warmup_cosine_decay.html b/docs/optimizers/adam_warmup_cosine_decay.html index f7de4b9c..6cb5783a 100644 --- a/docs/optimizers/adam_warmup_cosine_decay.html +++ b/docs/optimizers/adam_warmup_cosine_decay.html @@ -249,19 +249,46 @@ where $w$ is the number of warmup steps.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/optimizers/amsgrad.html b/docs/optimizers/amsgrad.html index 37925234..49bd1f02 100644 --- a/docs/optimizers/amsgrad.html +++ b/docs/optimizers/amsgrad.html @@ -526,19 +526,46 @@ You can see that AMSGrad converges to true optimal $x = -1$

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/optimizers/configs.html b/docs/optimizers/configs.html index ec4b2a2f..0c650059 100644 --- a/docs/optimizers/configs.html +++ b/docs/optimizers/configs.html @@ -395,19 +395,46 @@ i.e. weight decay is not added to gradients

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/optimizers/index.html b/docs/optimizers/index.html index 3022a8b6..d9e1ae76 100644 --- a/docs/optimizers/index.html +++ b/docs/optimizers/index.html @@ -531,19 +531,46 @@ when the decay is performed directly on the parameter. If this is false the actu displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/optimizers/mnist_experiment.html b/docs/optimizers/mnist_experiment.html index 40544253..0f6f2213 100644 --- a/docs/optimizers/mnist_experiment.html +++ b/docs/optimizers/mnist_experiment.html @@ -414,19 +414,46 @@ We can change the optimizer type and hyper-parameters using configurations.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/optimizers/noam.html b/docs/optimizers/noam.html index dc574bf1..9fdfa52a 100644 --- a/docs/optimizers/noam.html +++ b/docs/optimizers/noam.html @@ -233,19 +233,46 @@ where $w$ is the number of warmup steps.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/optimizers/performance_test.html b/docs/optimizers/performance_test.html index 5ceae84a..eba217ae 100644 --- a/docs/optimizers/performance_test.html +++ b/docs/optimizers/performance_test.html @@ -146,19 +146,46 @@ MyAdam...[DONE] 1,192.89ms displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/optimizers/radam.html b/docs/optimizers/radam.html index 7f9ec311..232d9d0a 100644 --- a/docs/optimizers/radam.html +++ b/docs/optimizers/radam.html @@ -629,19 +629,46 @@ $\theta_t \leftarrow \theta_{t-1} - \alpha \cdot \hat{m}_t$

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/optimizers/readme.html b/docs/optimizers/readme.html index 48879226..31ea6c0d 100644 --- a/docs/optimizers/readme.html +++ b/docs/optimizers/readme.html @@ -104,19 +104,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/pylit.css b/docs/pylit.css index e7ed7044..3b70fffe 100644 --- a/docs/pylit.css +++ b/docs/pylit.css @@ -459,28 +459,77 @@ span.lineno { color: #bd93f9; } -:root { - --blue: #007bff; - --indigo: #6610f2; - --purple: #6f42c1; - --pink: #e83e8c; - --red: #dc3545; - --orange: #fd7e14; - --yellow: #ffc107; - --green: #28a745; - --teal: #20c997; - --cyan: #17a2b8; - --white: #fff; - --gray: #6c757d; - --gray-dark: #343a40; - --primary: #007bff; - --secondary: #6c757d; - --success: #28a745; - --info: #17a2b8; - --warning: #ffc107; - --danger: #dc3545; - --light: #f8f9fa; - --dark: #343a40; +p > img { + max-height: 240px; + max-width: 240px; + border-radius: 5px; + cursor: pointer; + transition: 0.3s; +} +p > img:hover { + opacity: 0.7; +} + +#modal { + position: fixed; + z-index: 1000; + left: 0; + top: 0; + right: 0; + bottom: 0; + overflow: scroll; + background-color: rgba(0, 0, 0, 0.9); +} +#modal > div { + padding: 100px 10px 10px 10px; +} +#modal > div > img { + margin: auto; + display: block; + width: 80%; + max-width: 700px; +} +#modal > div > p { + margin: auto; + display: block; + width: 80%; + max-width: 700px; + text-align: center; + color: #ccc; + padding: 10px 0; + height: 150px; +} +#modal > div > img, #modal > div > p { + animation-name: zoom; + animation-duration: 0.6s; +} +@keyframes zoom { + from { + transform: scale(0); + } + to { + transform: scale(1); + } +} +#modal > span.close { + position: absolute; + top: 15px; + right: 35px; + color: #f1f1f1; + font-size: 40px; + font-weight: bold; + transition: 0.3s; +} +#modal > span.close:hover, #modal > span.close:focus { + color: #bbb; + text-decoration: none; + cursor: pointer; +} + +@media only screen and (max-width: 700px) { + #modal > img { + width: 100%; + } } /*# sourceMappingURL=pylit.css.map */ diff --git a/docs/recurrent_highway_networks/index.html b/docs/recurrent_highway_networks/index.html index 19c22847..0819c0c4 100644 --- a/docs/recurrent_highway_networks/index.html +++ b/docs/recurrent_highway_networks/index.html @@ -460,19 +460,46 @@ Rest of the layers get the input from the layer below

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/resnets/index.html b/docs/resnets/index.html index b90ff0a6..57da1527 100644 --- a/docs/resnets/index.html +++ b/docs/resnets/index.html @@ -84,19 +84,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/resnets/models/index.html b/docs/resnets/models/index.html index 65187660..e1da8625 100644 --- a/docs/resnets/models/index.html +++ b/docs/resnets/models/index.html @@ -85,19 +85,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/resnets/models/mlp.html b/docs/resnets/models/mlp.html index c105f42d..1754bcde 100644 --- a/docs/resnets/models/mlp.html +++ b/docs/resnets/models/mlp.html @@ -304,19 +304,46 @@ Also convert into float for FC layer

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/resnets/models/resnet.html b/docs/resnets/models/resnet.html index 1c068168..c015b100 100644 --- a/docs/resnets/models/resnet.html +++ b/docs/resnets/models/resnet.html @@ -531,19 +531,46 @@ Calculate the output shape after applying a convolution

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/resnets/pretrained_nets.html b/docs/resnets/pretrained_nets.html index 2c4afcf7..71cf11f5 100644 --- a/docs/resnets/pretrained_nets.html +++ b/docs/resnets/pretrained_nets.html @@ -254,19 +254,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/resnets/resnet_net.html b/docs/resnets/resnet_net.html index ee261ff3..1fa29455 100644 --- a/docs/resnets/resnet_net.html +++ b/docs/resnets/resnet_net.html @@ -253,19 +253,46 @@ Calculate the input shape

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/resnets/utils/index.html b/docs/resnets/utils/index.html index 22ebf200..73e81d54 100644 --- a/docs/resnets/utils/index.html +++ b/docs/resnets/utils/index.html @@ -85,19 +85,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/resnets/utils/labelsmoothing.html b/docs/resnets/utils/labelsmoothing.html index f651c6c6..acf7a0de 100644 --- a/docs/resnets/utils/labelsmoothing.html +++ b/docs/resnets/utils/labelsmoothing.html @@ -139,19 +139,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/resnets/utils/train.html b/docs/resnets/utils/train.html index 1d01632a..3f3bba24 100644 --- a/docs/resnets/utils/train.html +++ b/docs/resnets/utils/train.html @@ -376,19 +376,46 @@ from torch.utils.data.sampler import SubsetRandomSampler

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/resnets/utils/utils.html b/docs/resnets/utils/utils.html index 4de8c275..afa01710 100644 --- a/docs/resnets/utils/utils.html +++ b/docs/resnets/utils/utils.html @@ -224,19 +224,46 @@ subplot integers: displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/rl/dqn/experiment.html b/docs/rl/dqn/experiment.html index 8ea78c0d..b7a7814f 100644 --- a/docs/rl/dqn/experiment.html +++ b/docs/rl/dqn/experiment.html @@ -930,19 +930,46 @@ Gradients shouldn’t propagate for these

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/rl/dqn/index.html b/docs/rl/dqn/index.html index ff168d72..ded1f393 100644 --- a/docs/rl/dqn/index.html +++ b/docs/rl/dqn/index.html @@ -337,19 +337,46 @@ mean squared error loss because it is less sensitive to outliers

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/rl/dqn/model.html b/docs/rl/dqn/model.html index c80d2a6c..a7dc0232 100644 --- a/docs/rl/dqn/model.html +++ b/docs/rl/dqn/model.html @@ -322,19 +322,46 @@ $512$ features

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/rl/dqn/replay_buffer.html b/docs/rl/dqn/replay_buffer.html index 2e4bca65..fea0b3d0 100644 --- a/docs/rl/dqn/replay_buffer.html +++ b/docs/rl/dqn/replay_buffer.html @@ -775,19 +775,46 @@ to get the index of actual value

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/rl/game.html b/docs/rl/game.html index e45e712c..a55a9694 100644 --- a/docs/rl/game.html +++ b/docs/rl/game.html @@ -461,19 +461,46 @@ i.e, each channel is a frame.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/rl/index.html b/docs/rl/index.html index 28656992..6aaacbd5 100644 --- a/docs/rl/index.html +++ b/docs/rl/index.html @@ -109,19 +109,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/rl/ppo/experiment.html b/docs/rl/ppo/experiment.html index a826c552..a2037b1c 100644 --- a/docs/rl/ppo/experiment.html +++ b/docs/rl/ppo/experiment.html @@ -1282,19 +1282,46 @@ You can change this while the experiment is running. displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/rl/ppo/gae.html b/docs/rl/ppo/gae.html index cb7ca228..976623f4 100644 --- a/docs/rl/ppo/gae.html +++ b/docs/rl/ppo/gae.html @@ -245,19 +245,46 @@ The performance of the model was improving displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/rl/ppo/index.html b/docs/rl/ppo/index.html index a894a8ea..03444f71 100644 --- a/docs/rl/ppo/index.html +++ b/docs/rl/ppo/index.html @@ -337,19 +337,46 @@ V^{\pi_\theta}_{CLIP}(s_t) displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/rl/ppo/readme.html b/docs/rl/ppo/readme.html index e9e38a9b..c29a21c0 100644 --- a/docs/rl/ppo/readme.html +++ b/docs/rl/ppo/readme.html @@ -110,19 +110,46 @@ The experiment uses Generalized Ad displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/sitemap.xml b/docs/sitemap.xml index c729294a..80a4d1a5 100644 --- a/docs/sitemap.xml +++ b/docs/sitemap.xml @@ -104,6 +104,20 @@ + + https://nn.labml.ai/gan/stylegan/index.html + 2021-05-21T16:30:00+00:00 + 1.00 + + + + + https://nn.labml.ai/gan/stylegan/experiment.html + 2021-05-21T16:30:00+00:00 + 1.00 + + + https://nn.labml.ai/gan/cycle_gan/experiment.html 2021-05-07T16:30:00+00:00 @@ -127,7 +141,7 @@ https://nn.labml.ai/gan/index.html - 2021-05-07T16:30:00+00:00 + 2021-05-09T16:30:00+00:00 1.00 @@ -428,7 +442,7 @@ https://nn.labml.ai/index.html - 2021-05-07T16:30:00+00:00 + 2021-05-09T16:30:00+00:00 1.00 @@ -862,7 +876,7 @@ https://nn.labml.ai/utils.html - 2021-02-17T16:30:00+00:00 + 2021-05-21T16:30:00+00:00 1.00 diff --git a/docs/sketch_rnn/index.html b/docs/sketch_rnn/index.html index ab6a70bd..13554a06 100644 --- a/docs/sketch_rnn/index.html +++ b/docs/sketch_rnn/index.html @@ -2103,19 +2103,46 @@ Paper had suggested 1e-4.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/compressive/experiment.html b/docs/transformers/compressive/experiment.html index 94b8fbe8..4bcba56a 100644 --- a/docs/transformers/compressive/experiment.html +++ b/docs/transformers/compressive/experiment.html @@ -1309,19 +1309,46 @@ Memories that were compressed are needed for the reconstruction loss computation displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/compressive/index.html b/docs/transformers/compressive/index.html index be44b9cb..e1790845 100644 --- a/docs/transformers/compressive/index.html +++ b/docs/transformers/compressive/index.html @@ -927,19 +927,46 @@ The parameters of $f_c^{(i)}$ are the only parameters not detached from gradient displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/compressive/readme.html b/docs/transformers/compressive/readme.html index 66b73b03..92901073 100644 --- a/docs/transformers/compressive/readme.html +++ b/docs/transformers/compressive/readme.html @@ -129,19 +129,46 @@ model on the Tiny Shakespeare dataset.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/configs.html b/docs/transformers/configs.html index e6993833..c4e80918 100644 --- a/docs/transformers/configs.html +++ b/docs/transformers/configs.html @@ -950,19 +950,46 @@ are calculated.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/fast_weights/experiment.html b/docs/transformers/fast_weights/experiment.html index 0e7d4c35..728da48b 100644 --- a/docs/transformers/fast_weights/experiment.html +++ b/docs/transformers/fast_weights/experiment.html @@ -356,19 +356,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/fast_weights/index.html b/docs/transformers/fast_weights/index.html index e18314aa..c24a6d5b 100644 --- a/docs/transformers/fast_weights/index.html +++ b/docs/transformers/fast_weights/index.html @@ -885,19 +885,46 @@ y^{(i)} &= \color{cyan}{W^{(i)}} \color{lightgreen}{\phi'(q^{(i)})} displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/fast_weights/readme.html b/docs/transformers/fast_weights/readme.html index b716be72..341c11ab 100644 --- a/docs/transformers/fast_weights/readme.html +++ b/docs/transformers/fast_weights/readme.html @@ -103,19 +103,46 @@ and a notebook for training a fast weights transformer on the Tiny Shakespeare d displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/fast_weights/token_wise.html b/docs/transformers/fast_weights/token_wise.html index 00dbefa0..2474a782 100644 --- a/docs/transformers/fast_weights/token_wise.html +++ b/docs/transformers/fast_weights/token_wise.html @@ -514,19 +514,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/feed_forward.html b/docs/transformers/feed_forward.html index 9420233f..feccc807 100644 --- a/docs/transformers/feed_forward.html +++ b/docs/transformers/feed_forward.html @@ -305,19 +305,46 @@ depending on whether it is gated

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/feedback/README.html b/docs/transformers/feedback/README.html index d3ac481c..abfcabe6 100644 --- a/docs/transformers/feedback/README.html +++ b/docs/transformers/feedback/README.html @@ -122,19 +122,46 @@ We implemented a custom PyTorch function to improve performance.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/feedback/experiment.html b/docs/transformers/feedback/experiment.html index d9e56278..9346fe70 100644 --- a/docs/transformers/feedback/experiment.html +++ b/docs/transformers/feedback/experiment.html @@ -404,19 +404,46 @@ where the keys and values are precalculated.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/feedback/index.html b/docs/transformers/feedback/index.html index 46d9a107..2249c9f1 100644 --- a/docs/transformers/feedback/index.html +++ b/docs/transformers/feedback/index.html @@ -1695,19 +1695,46 @@ This is the weights parameter for that.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/glu_variants/experiment.html b/docs/transformers/glu_variants/experiment.html index 57e7b31e..73e70aae 100644 --- a/docs/transformers/glu_variants/experiment.html +++ b/docs/transformers/glu_variants/experiment.html @@ -437,19 +437,46 @@ implementation

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/glu_variants/index.html b/docs/transformers/glu_variants/index.html index 83b154ff..06a5da59 100644 --- a/docs/transformers/glu_variants/index.html +++ b/docs/transformers/glu_variants/index.html @@ -100,19 +100,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/glu_variants/simple.html b/docs/transformers/glu_variants/simple.html index 7ed19603..89c9b7da 100644 --- a/docs/transformers/glu_variants/simple.html +++ b/docs/transformers/glu_variants/simple.html @@ -1113,19 +1113,46 @@ a linear layer to generate logits.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/gpt/index.html b/docs/transformers/gpt/index.html index 01a130ef..4bb11bd0 100644 --- a/docs/transformers/gpt/index.html +++ b/docs/transformers/gpt/index.html @@ -849,19 +849,46 @@ per epoch

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/index.html b/docs/transformers/index.html index 243f572e..a9ef14de 100644 --- a/docs/transformers/index.html +++ b/docs/transformers/index.html @@ -133,19 +133,46 @@ It does single GPU training but we implement the concept of switching as describ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/knn/build_index.html b/docs/transformers/knn/build_index.html index f93f18c6..411d26f8 100644 --- a/docs/transformers/knn/build_index.html +++ b/docs/transformers/knn/build_index.html @@ -594,19 +594,46 @@ doesn’t store full vectors.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/knn/eval_knn.html b/docs/transformers/knn/eval_knn.html index f532bfce..fbae5e12 100644 --- a/docs/transformers/knn/eval_knn.html +++ b/docs/transformers/knn/eval_knn.html @@ -554,19 +554,46 @@ each of the weights

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/knn/index.html b/docs/transformers/knn/index.html index 36c9a387..cf8a01ed 100644 --- a/docs/transformers/knn/index.html +++ b/docs/transformers/knn/index.html @@ -119,19 +119,46 @@ of disk space for the index.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/knn/train_model.html b/docs/transformers/knn/train_model.html index 14c0dddb..3e71b8fc 100644 --- a/docs/transformers/knn/train_model.html +++ b/docs/transformers/knn/train_model.html @@ -486,19 +486,46 @@ final token generator from configurable transformer

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/label_smoothing_loss.html b/docs/transformers/label_smoothing_loss.html index 0bd0d15e..42006422 100644 --- a/docs/transformers/label_smoothing_loss.html +++ b/docs/transformers/label_smoothing_loss.html @@ -214,19 +214,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/mha.html b/docs/transformers/mha.html index a4553a63..d749979f 100644 --- a/docs/transformers/mha.html +++ b/docs/transformers/mha.html @@ -574,19 +574,46 @@ $\underset{seq}{softmax}\Bigg(\frac{Q K^\top}{\sqrt{d_k}}\Bigg)$

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/models.html b/docs/transformers/models.html index 15f793cb..cbd5f4a8 100644 --- a/docs/transformers/models.html +++ b/docs/transformers/models.html @@ -705,19 +705,46 @@ Initialize parameters with Glorot / fan_avg.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/positional_encoding.html b/docs/transformers/positional_encoding.html index 584ee620..f536f01e 100644 --- a/docs/transformers/positional_encoding.html +++ b/docs/transformers/positional_encoding.html @@ -265,19 +265,46 @@ PE_{p,2i + 1} &= cos\Bigg(\frac{p}{10000^{\frac{2i}{d_{model}}}}\Bigg) displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/relative_mha.html b/docs/transformers/relative_mha.html index fd3f7414..85a9cca3 100644 --- a/docs/transformers/relative_mha.html +++ b/docs/transformers/relative_mha.html @@ -4,7 +4,7 @@ - + @@ -85,19 +85,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/switch/experiment.html b/docs/transformers/switch/experiment.html index ba225c83..bd34fbb2 100644 --- a/docs/transformers/switch/experiment.html +++ b/docs/transformers/switch/experiment.html @@ -806,19 +806,46 @@ set to something small like $\alpha = 0.01$.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/switch/index.html b/docs/transformers/switch/index.html index 279ab732..15ed6649 100644 --- a/docs/transformers/switch/index.html +++ b/docs/transformers/switch/index.html @@ -711,19 +711,46 @@ with handling extra outputs of switch feedforward module.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/switch/readme.html b/docs/transformers/switch/readme.html index ea5d5a4d..5b18542b 100644 --- a/docs/transformers/switch/readme.html +++ b/docs/transformers/switch/readme.html @@ -119,19 +119,46 @@ discusses dropping tokens when routing is not balanced.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/utils.html b/docs/transformers/utils.html index 972ea98b..5f28119e 100644 --- a/docs/transformers/utils.html +++ b/docs/transformers/utils.html @@ -135,19 +135,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/xl/experiment.html b/docs/transformers/xl/experiment.html index 49e9cad1..60ca545c 100644 --- a/docs/transformers/xl/experiment.html +++ b/docs/transformers/xl/experiment.html @@ -988,19 +988,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/xl/index.html b/docs/transformers/xl/index.html index a3ab5c4b..f657c2cd 100644 --- a/docs/transformers/xl/index.html +++ b/docs/transformers/xl/index.html @@ -441,19 +441,46 @@ which will become the memories for the next sequential batch.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/xl/readme.html b/docs/transformers/xl/readme.html index 5c476e39..ef974df3 100644 --- a/docs/transformers/xl/readme.html +++ b/docs/transformers/xl/readme.html @@ -114,19 +114,46 @@ are introduced at the attention calculation.

displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/docs/transformers/xl/relative_mha.html b/docs/transformers/xl/relative_mha.html index 915b7bc6..f68b99f2 100644 --- a/docs/transformers/xl/relative_mha.html +++ b/docs/transformers/xl/relative_mha.html @@ -411,19 +411,46 @@ to get + \ No newline at end of file diff --git a/docs/utils.html b/docs/utils.html index 0177e8c7..a30a2fd6 100644 --- a/docs/utils.html +++ b/docs/utils.html @@ -83,7 +83,8 @@
-

Make a nn.ModuleList with clones of a given layer

+

Clone Module

+

Make a nn.ModuleList with clones of a given module

15def clone_module_list(module: M, n: int) -> TypedModuleList[M]:
@@ -97,7 +98,33 @@
-
19    return TypedModuleList([copy.deepcopy(module) for _ in range(n)])
+
21    return TypedModuleList([copy.deepcopy(module) for _ in range(n)])
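For example (a small sketch; layer stands for any nn.Module instance):

    layers = clone_module_list(layer, 6)   # six independent deep copies in a module list
    assert len(layers) == 6
    assert layers[0] is not layers[1]      # clones do not share parameters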
+
+ +
+
+ +

+

Cycle Data Loader

+

Infinite loader that recycles the data loader after each epoch
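For example (a sketch assuming a PyTorch DataLoader named train_loader and a step count total_steps; the function itself is defined just below):

    batches = cycle_dataloader(train_loader)
    for step in range(total_steps):        # step-based training loop instead of epoch-based
        batch = next(batches)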

+
+
+
24def cycle_dataloader(data_loader):
+
+
+
+
+ + +
+
+
31    while True:
+32        for batch in data_loader:
+33            yield batch
@@ -118,19 +145,46 @@ displayAlign: 'center', "HTML-CSS": { fonts: ["TeX"] } }); + + \ No newline at end of file diff --git a/labml_nn/gan/stylegan/__init__.py b/labml_nn/gan/stylegan/__init__.py new file mode 100644 index 00000000..570216b0 --- /dev/null +++ b/labml_nn/gan/stylegan/__init__.py @@ -0,0 +1,947 @@ +""" +--- +title: Style GAN 2 +summary: > + An annotated PyTorch implementation of StyleGAN2. +--- + +# Style GAN 2 + +This is a [PyTorch](https://pytorch.org) implementation of the paper + [Analyzing and Improving the Image Quality of StyleGAN](https://arxiv.org/abs/1912.04958) + which introduces **Style GAN2**. +Style GAN2 is an improvement over **Style GAN** from the paper + [A Style-Based Generator Architecture for Generative Adversarial Networks](https://arxiv.org/abs/1812.04948). +And Style GAN is based on **Progressive GAN** from the paper + [Progressive Growing of GANs for Improved Quality, Stability, and Variation](https://arxiv.org/abs/1710.10196). +All three papers are from the same authors from [NVIDIA AI](https://twitter.com/NVIDIAAI). + +*Our implementation is a minimalistic Style GAN2 model training code. +Only single GPU training is supported to keep the implementation simple. +We managed to shrink it to keep it at less than 500 lines of code, including the training loop.* + +**🏃 Here's the training code: [`experiment.py`](experiment.html).** + +![Generated Images](generated_64.png) + +*These are $64 \times 64$ images generated after training for about 80K steps.* + + +We'll first introduce the three papers at a high level. + +## Generative Adversarial Networks + +Generative adversarial networks have two components; the generator and the discriminator. +The generator network takes a random latent vector ($z \in \mathcal{Z}$) + and tries to generate a realistic image. +The discriminator network tries to differentiate the real images from generated images. +When we train the two networks together the generator starts generating images indistinguishable from real images. + +## Progressive GAN + +Progressive GAN generates high-resolution images ($1080 \times 1080$) of size. +It does so by *progressively* increasing the image size. +First, it trains a network that produces a $4 \times 4$ image, then $8 \times 8$ , + then an $16 \times 16$ image, and so on up to the desired image resolution. + +At each resolution, the generator network produces an image in latent space which is converted into RGB, +with a $1 \times 1$ convolution. +When we progress from a lower resolution to a higher resolution + (say from $4 \times 4$ to $8 \times 8$ ) we scale the latent image by $2\times$ + and add a new block (two $3 \times 3$ convolution layers) + and a new $1 \times 1$ layer to get RGB. +The transition is done smoothly by adding a residual connection to + the $2\times$ scaled $4 \times 4$ RGB image. +The weight of this residual connection is slowly reduced, to let the new block take over. + +The discriminator is a mirror image of the generator network. +The progressive growth of the discriminator is done similarly. + +![progressive_gan.svg](progressive_gan.svg) + +*$2\times$ and $0.5\times$ denote feature map resolution scaling and scaling. +$4\times4$, $8\times4$, ... denote feature map resolution at the generator or discriminator block. 
+Each discriminator and generator block consists of 2 convolution layers with leaky ReLU activations.* + +They use **minibatch standard deviation** to increase variation and + **equalized learning rate** which we discussed below in the implementation. +They also use **pixel-wise normalization** where at each pixel the feature vector is normalized. +They apply this to all the convolution layer outputs (except RGB). + + +## Style GAN + +Style GAN improves the generator of Progressive GAN keeping the discriminator architecture the same. + +#### Mapping Network + +It maps the random latent vector ($z \in \mathcal{Z}$) + into a different latent space ($w \in \mathcal{W}$), + with an 8-layer neural network. +This gives an intermediate latent space $\mathcal{W}$ +where the factors of variations are more linear (disentangled). + +#### AdaIN + +Then $w$ is transformed into two vectors (***styles***) per layer, + $i$, $y_i = (y_{s,i}, y_{b,i}) = f_{A_i}(w)$ and used for scaling and shifting (biasing) + in each layer with $\text{AdaIN}$ operator (normalize and scale): +$$\text{AdaIN}(x_i, y_i) = y_{s, i} \frac{x_i - \mu(x_i)}{\sigma(x_i)} + y_{b,i}$$ + +#### Style Mixing + +To prevent the generator from assuming adjacent styles are correlated, + they randomly use different styles for different blocks. +That is, they sample two latent vectors $(z_1, z_2)$ and corresponding $(w_1, w_2)$ and + use $w_1$ based styles for some blocks and $w_2$ based styles for some blacks randomly. + +#### Stochastic Variation + +Noise is made available to each block which helps the generator create more realistic images. +Noise is scaled per channel by a learned weight. + +#### Bilinear Up and Down Sampling + +All the up and down-sampling operations are accompanied by bilinear smoothing. + +![style_gan.svg](style_gan.svg) + +*$A$ denotes a linear layer. +$B$ denotes a broadcast and scaling operation (noise is a single channel). +Style GAN also uses progressive growing like Progressive GAN* + +## Style GAN 2 + +Style GAN 2 changes both the generator and the discriminator of Style GAN. + +#### Weight Modulation and Demodulation + +They remove the $\text{AdaIN}$ operator and replace it with + the weight modulation and demodulation step. +This is supposed to improve what they call droplet artifacts that are present in generated images, + which are caused by the normalization in $\text{AdaIN}$ operator. +Style vector per layer is calculated from $w_i \in \mathcal{W}$ as $s_i = f_{A_i}(w_i)$. + +Then the convolution weights $w$ are modulated as follows. +($w$ here on refers to weights not intermediate latent space, + we are sticking to the same notation as the paper.) + +$$w'_{i, j, k} = s_i \cdot w_{i, j, k}$$ +Then it's demodulated by normalizing, +$$w''_{i,j,k} = \frac{w'_{i,j,k}}{\sqrt{\sum_{i,k}{w'_{i, j, k}}^2 + \epsilon}}$$ +where $i$ is the input channel, $j$ is the output channel, and $k$ is the kernel index. + +#### Path Length Regularization + +Path length regularization encourages a fixed-size step in $\mathcal{W}$ to result in a non-zero, + fixed-magnitude change in the generated image. + +#### No Progressive Growing + +StyleGAN2 uses residual connections (with down-sampling) in the discriminator and skip connections + in the generator with up-sampling + (the RGB outputs from each layer are added - no residual connections in feature maps). +They show that with experiments that the contribution of low-resolution layers is higher + at beginning of the training and then high-resolution layers take over. 
+""" + +import math +from typing import Tuple, Optional, List + +import numpy as np +import torch +import torch.nn.functional as F +import torch.utils.data +from torch import nn + + +class MappingNetwork(nn.Module): + """ + + ## Mapping Network + + ![Mapping Network](mapping_network.svg) + + This is an MLP with 8 linear layers. + The mapping network maps the latent vector $z \in \mathcal{W}$ + to an intermediate latent space $w \in \mathcal{W}$. + $\mathcal{W}$ space will be disentangled from the image space + where the factors of variation become more linear. + """ + + def __init__(self, features: int, n_layers: int): + """ + * `features` is the number of features in $z$ and $w$ + * `n_layers` is the number of layers in the mapping network. + """ + super().__init__() + + # Create the MLP + layers = [] + for i in range(n_layers): + # [Equalized learning-rate linear layers](#equalized_linear) + layers.append(EqualizedLinear(features, features)) + # Leaky Relu + layers.append(nn.LeakyReLU(negative_slope=0.2, inplace=True)) + + self.net = nn.Sequential(*layers) + + def forward(self, z: torch.Tensor): + # Normalize $z$ + z = F.normalize(z, dim=1) + # Map $z$ to $w$ + return self.net(z) + + +class Generator(nn.Module): + """ + + ## StyleGAN2 Generator + + ![Generator](style_gan2.svg) + + *$A$ denotes a linear layer. + $B$ denotes a broadcast and scaling operation (noise is a single channel). + [*toRGB*](#to_rgb) also has a style modulation which is not shown in the diagram to keep it simple.* + + The generator starts with a learned constant. + Then it has a series of blocks. The feature map resolution is doubled at each block + Each block outputs an RGB image and they are scaled up and summed to get the final RGB image. + """ + + def __init__(self, log_resolution: int, d_latent: int, n_features: int = 32, max_features: int = 512): + """ + * `log_resolution` is the $\log_2$ of image resolution + * `d_latent` is the dimensionality of $w$ + * `n_features` number of features in the convolution layer at the highest resolution (final block) + * `max_features` maximum number of features in any generator block + """ + super().__init__() + + # Calculate the number of features for each block + # + # Something like `[512, 512, 256, 128, 64, 32]` + features = [min(max_features, n_features * (2 ** i)) for i in range(log_resolution - 2, -1, -1)] + # Number of generator blocks + self.n_blocks = len(features) + + # Trainable $4 \times 4$ constant + self.initial_constant = nn.Parameter(torch.randn((1, features[0], 4, 4))) + + # First style block for $4 \times 4$ resolution and layer to get RGB + self.style_block = StyleBlock(d_latent, features[0], features[0]) + self.to_rgb = ToRGB(d_latent, features[0]) + + # Generator blocks + blocks = [GeneratorBlock(d_latent, features[i - 1], features[i]) for i in range(1, self.n_blocks)] + self.blocks = nn.ModuleList(blocks) + + # $2 \times$ up sampling layer. The feature space is up sampled + # at each block + self.up_sample = UpSample() + + def forward(self, w: torch.Tensor, input_noise: List[Tuple[Optional[torch.Tensor], Optional[torch.Tensor]]]): + """ + * `w` is $w$. In order to mix-styles (use different $w$ for different layers), we provide a separate + $w$ for each [generator block](#generator_block). It has shape `[n_blocks, batch_size, d_latent]1. + * `input_noise` is the noise for each block. + It's a list of pairs of noise sensors because each block (except the initial) has two noise inputs + after each convolution layer (see the diagram). 
+ """ + + # Get batch size + batch_size = w.shape[1] + + # Expand the learned constant to match batch size + x = self.initial_constant.expand(batch_size, -1, -1, -1) + + # The first style block + x = self.style_block(x, w[0], input_noise[0][1]) + # Get first rgb image + rgb = self.to_rgb(x, w[0]) + + # Evaluate rest of the blocks + for i in range(1, self.n_blocks): + # Up sample the feature map + x = self.up_sample(x) + # Run it through the [generator block](#generator_block) + x, rgb_new = self.blocks[i - 1](x, w[i], input_noise[i]) + # Up sample the RGB image and add to the rgb from the block + rgb = self.up_sample(rgb) + rgb_new + + # Return the final RGB image + return rgb + + +class GeneratorBlock(nn.Module): + """ + + ### Generator Block + + ![Generator block](generator_block.svg) + + *$A$ denotes a linear layer. + $B$ denotes a broadcast and scaling operation (noise is a single channel). + [*toRGB*](#to_rgb) also has a style modulation which is not shown in the diagram to keep it simple.* + + The generator block consists of two [style blocks](#style_block) ($3 \times 3$ convolutions with style modulation) + and an RGB output. + """ + + def __init__(self, d_latent: int, in_features: int, out_features: int): + """ + * `d_latent` is the dimensionality of $w$ + * `in_features` is the number of features in the input feature map + * `out_features` is the number of features in the output feature map + """ + super().__init__() + + # First [style block](#style_block) changes the feature map size to `out_features` + self.style_block1 = StyleBlock(d_latent, in_features, out_features) + # Second [style block](#style_block) + self.style_block2 = StyleBlock(d_latent, out_features, out_features) + + # *toRGB* layer + self.to_rgb = ToRGB(d_latent, out_features) + + def forward(self, x: torch.Tensor, w: torch.Tensor, noise: Tuple[Optional[torch.Tensor], Optional[torch.Tensor]]): + """ + * `x` is the input feature map of shape `[batch_size, in_features, height, width]` + * `w` is $w$ with shape `[batch_size, d_latent]` + * `noise` is a tuple of two noise tensors of shape `[batch_size, 1, height, width]` + """ + # First style block with first noise tensor. + # The output is of shape `[batch_size, out_features, height, width]` + x = self.style_block1(x, w, noise[0]) + # Second style block with second noise tensor. + # The output is of shape `[batch_size, out_features, height, width]` + x = self.style_block2(x, w, noise[1]) + + # Get RGB image + rgb = self.to_rgb(x, w) + + # Return feature map and rgb image + return x, rgb + + +class StyleBlock(nn.Module): + """ + + ### Style Block + + ![Style block](style_block.svg) + + *$A$ denotes a linear layer. + $B$ denotes a broadcast and scaling operation (noise is single channel).* + + Style block has a weight modulation convolution layer. 
+ """ + + def __init__(self, d_latent: int, in_features: int, out_features: int): + """ + * `d_latent` is the dimensionality of $w$ + * `in_features` is the number of features in the input feature map + * `out_features` is the number of features in the output feature map + """ + super().__init__() + # Get style vector from $w$ (denoted by $A$ in the diagram) with + # an [equalized learning-rate linear layer](#equalized_linear) + self.to_style = EqualizedLinear(d_latent, in_features, bias=1.0) + # Weight modulated convolution layer + self.conv = Conv2dWeightModulate(in_features, out_features, kernel_size=3) + # Noise scale + self.scale_noise = nn.Parameter(torch.zeros(1)) + # Bias + self.bias = nn.Parameter(torch.zeros(out_features)) + + # Activation function + self.activation = nn.LeakyReLU(0.2, True) + + def forward(self, x: torch.Tensor, w: torch.Tensor, noise: Optional[torch.Tensor]): + """ + * `x` is the input feature map of shape `[batch_size, in_features, height, width]` + * `w` is $w$ with shape `[batch_size, d_latent]` + * `noise` is a tensor of shape `[batch_size, 1, height, width]` + """ + # Get style vector $s$ + s = self.to_style(w) + # Weight modulated convolution + x = self.conv(x, s) + # Scale and add noise + if noise is not None: + x = x + self.scale_noise[None, :, None, None] * noise + # Add bias and evaluate activation function + return self.activation(x + self.bias[None, :, None, None]) + + +class ToRGB(nn.Module): + """ + + ### To RGB + + ![To RGB](to_rgb.svg) + + *$A$ denotes a linear layer.* + + Generates an RGB image from a feature map using $1 \times 1$ convolution. + """ + + def __init__(self, d_latent: int, features: int): + """ + * `d_latent` is the dimensionality of $w$ + * `features` is the number of features in the feature map + """ + super().__init__() + # Get style vector from $w$ (denoted by $A$ in the diagram) with + # an [equalized learning-rate linear layer](#equalized_linear) + self.to_style = EqualizedLinear(d_latent, features, bias=1.0) + + # Weight modulated convolution layer without demodulation + self.conv = Conv2dWeightModulate(features, 3, kernel_size=1, demodulate=False) + # Bias + self.bias = nn.Parameter(torch.zeros(1)) + # Activation function + self.activation = nn.LeakyReLU(0.2, True) + + def forward(self, x: torch.Tensor, w: torch.Tensor): + """ + * `x` is the input feature map of shape `[batch_size, in_features, height, width]` + * `w` is $w$ with shape `[batch_size, d_latent]` + """ + # Get style vector $s$ + style = self.to_style(w) + # Weight modulated convolution + x = self.conv(x, style) + # Add bias and evaluate activation function + return self.activation(x + self.bias[None, :, None, None]) + + +class Conv2dWeightModulate(nn.Module): + """ + ### Convolution with Weight Modulation and Demodulation + + This layer scales the convolution weights by the style vector and demodulates by normalizing it. 
+    """
+
+    def __init__(self, in_features: int, out_features: int, kernel_size: int,
+                 demodulate: bool = True, eps: float = 1e-8):
+        """
+        * `in_features` is the number of features in the input feature map
+        * `out_features` is the number of features in the output feature map
+        * `kernel_size` is the size of the convolution kernel
+        * `demodulate` is a flag indicating whether to normalize the weights by their standard deviation
+        * `eps` is the $\epsilon$ for normalizing
+        """
+        super().__init__()
+        # Number of output features
+        self.out_features = out_features
+        # Whether to normalize weights
+        self.demodulate = demodulate
+        # Padding size
+        self.padding = (kernel_size - 1) // 2
+
+        # [Weights parameter with equalized learning rate](#equalized_weight)
+        self.weight = EqualizedWeight([out_features, in_features, kernel_size, kernel_size])
+        # $\epsilon$
+        self.eps = eps
+
+    def forward(self, x: torch.Tensor, s: torch.Tensor):
+        """
+        * `x` is the input feature map of shape `[batch_size, in_features, height, width]`
+        * `s` is the style-based scaling tensor of shape `[batch_size, in_features]`
+        """
+
+        # Get batch size, height and width
+        b, _, h, w = x.shape
+
+        # Reshape the scales
+        s = s[:, None, :, None, None]
+        # Get [learning rate equalized weights](#equalized_weight)
+        weights = self.weight()[None, :, :, :, :]
+        # $$w'_{i, j, k} = s_i \cdot w_{i, j, k}$$
+        # where $i$ is the input channel, $j$ is the output channel, and $k$ is the kernel index.
+        #
+        # The result has shape `[batch_size, out_features, in_features, kernel_size, kernel_size]`
+        weights = weights * s
+
+        # Demodulate
+        if self.demodulate:
+            # $$\sigma_j = \sqrt{\sum_{i,k} (w'_{i, j, k})^2 + \epsilon}$$
+            sigma_inv = torch.rsqrt((weights ** 2).sum(dim=(2, 3, 4), keepdim=True) + self.eps)
+            # $$w''_{i,j,k} = \frac{w'_{i,j,k}}{\sqrt{\sum_{i,k} (w'_{i, j, k})^2 + \epsilon}}$$
+            weights = weights * sigma_inv
+
+        # Reshape `x`
+        x = x.reshape(1, -1, h, w)
+
+        # Reshape weights
+        _, _, *ws = weights.shape
+        weights = weights.reshape(b * self.out_features, *ws)
+
+        # Use grouped convolution to efficiently calculate the convolution with a sample-wise kernel.
+        # i.e. we have a different kernel (weights) for each sample in the batch
+        x = F.conv2d(x, weights, padding=self.padding, groups=b)
+
+        # Reshape `x` to `[batch_size, out_features, height, width]` and return
+        return x.reshape(-1, self.out_features, h, w)
+
+
+class Discriminator(nn.Module):
+    """
+
+    ## Style GAN2 Discriminator
+
+    ![Discriminator](style_gan2_disc.svg)
+
+    The discriminator first transforms the image to a feature map of the same resolution and then
+    runs it through a series of blocks with residual connections.
+    The resolution is down-sampled by $2 \times$ at each block while doubling the
+    number of features.
+    """
+
+    def __init__(self, log_resolution: int, n_features: int = 64, max_features: int = 512):
+        """
+        * `log_resolution` is the $\log_2$ of image resolution
+        * `n_features` is the number of features in the convolution layer at the highest resolution (first block)
+        * `max_features` is the maximum number of features in any discriminator block
+        """
+        super().__init__()
+
+        # Layer to convert RGB image to a feature map with `n_features` number of features.
+        self.from_rgb = nn.Sequential(
+            EqualizedConv2d(3, n_features, 1),
+            nn.LeakyReLU(0.2, True),
+        )
+
+        # Calculate the number of features for each block.
+        #
+        # Something like `[64, 128, 256, 512, 512, 512]`.
+ features = [min(max_features, n_features * (2 ** i)) for i in range(log_resolution - 1)] + # Number of [discirminator blocks](#discriminator_block) + n_blocks = len(features) - 1 + # Discriminator blocks + blocks = [DiscriminatorBlock(features[i], features[i + 1]) for i in range(n_blocks)] + self.blocks = nn.Sequential(*blocks) + + # [Mini-batch Standard Deviation](#mini_batch_std_dev) + self.std_dev = MiniBatchStdDev() + # Number of features after adding the standard deviations map + final_features = features[-1] + 1 + # Final $3 \times 3$ convolution layer + self.conv = EqualizedConv2d(final_features, final_features, 3) + # Final linear layer to get the classification + self.final = EqualizedLinear(2 * 2 * final_features, 1) + + def forward(self, x: torch.Tensor): + """ + * `x` is the input image of shape `[batch_size, 3, height, width]` + """ + + # Try to normalize the image (this is totally optional, but sped up the early training a little) + x = x - 0.5 + # Convert from RGB + x = self.from_rgb(x) + # Run through the [discriminator blocks](#discriminator_block) + x = self.blocks(x) + + # Calculate and append [mini-batch standard deviation](#mini_batch_std_dev) + x = self.std_dev(x) + # $3 \times 3$ convolution + x = self.conv(x) + # Flatten + x = x.reshape(x.shape[0], -1) + # Return the classification score + return self.final(x) + + +class DiscriminatorBlock(nn.Module): + """ + + ### Discriminator Block + + ![Discriminator block](discriminator_block.svg) + + Discriminator block consists of two $3 \times 3$ convolutions with a residual connection. + """ + + def __init__(self, in_features, out_features): + """ + * `in_features` is the number of features in the input feature map + * `out_features` is the number of features in the output feature map + """ + super().__init__() + # Down-sampling and $1 \times 1$ convolution layer for the residual connection + self.residual = nn.Sequential(DownSample(), + EqualizedConv2d(in_features, out_features, kernel_size=1)) + + # Two $3 \times 3$ convolutions + self.block = nn.Sequential( + EqualizedConv2d(in_features, in_features, kernel_size=3, padding=1), + nn.LeakyReLU(0.2, True), + EqualizedConv2d(in_features, out_features, kernel_size=3, padding=1), + nn.LeakyReLU(0.2, True), + ) + + # Down-sampling layer + self.down_sample = DownSample() + + # Scaling factor $\frac{1}{\sqrt 2}$ after adding the residual + self.scale = 1 / math.sqrt(2) + + def forward(self, x): + # Get the residual connection + residual = self.residual(x) + + # Convolutions + x = self.block(x) + # Down-sample + x = self.down_sample(x) + + # Add the residual and scale + return (x + residual) * self.scale + + +class MiniBatchStdDev(nn.Module): + """ + + + ### Mini-batch Standard Deviation + + Mini-batch standard deviation calculates the standard deviation + across a mini-batch (or a subgroups within the mini-batch) + for each feature in the feature map. Then it takes the mean of all + the standard deviations and appends it to the feature map as one extra feature. + """ + + def __init__(self, group_size: int = 4): + """ + * `group_size` is the number of samples to calculate standard deviation across. 
+ """ + super().__init__() + self.group_size = group_size + + def forward(self, x: torch.Tensor): + """ + * `x` is the feature map + """ + # Check if the batch size is divisible by the group size + assert x.shape[0] % self.group_size == 0 + # Split the samples into groups of `group_size`, we flatten the feature map to a single dimension + # since we want to calculate the standard deviation for each feature. + grouped = x.view(self.group_size, -1) + # Calculate the standard deviation for each feature among `group_size` samples + # $$\mu_{i} = \frac{1}{N} \sum_g x_{g,i} \\ + # \sigma_{i} = \sqrt{\frac{1}{N} \sum_g (x_{g,i} - \mu_i)^2 + \epsilon}$$ + std = torch.sqrt(grouped.var(dim=0) + 1e-8) + # Get the mean standard deviation + std = std.mean().view(1, 1, 1, 1) + # Expand the standard deviation to append to the feature map + b, _, h, w = x.shape + std = std.expand(b, -1, h, w) + # Append (concatenate) the standard deviations to the feature map + return torch.cat([x, std], dim=1) + + +class DownSample(nn.Module): + """ + + ### Down-sample + + The down-sample operation [smoothens](#smooth) each feature channel and + scale $2 \times$ using bilinear interpolation. + This is based on the paper + [Making Convolutional Networks Shift-Invariant Again](https://arxiv.org/abs/1904.11486). + """ + + def __init__(self): + super().__init__() + # Smoothing layer + self.smooth = Smooth() + + def forward(self, x: torch.Tensor): + # Smoothing or blurring + x = self.smooth(x) + # Scaled down + return F.interpolate(x, (x.shape[2] // 2, x.shape[3] // 2), mode='bilinear', align_corners=False) + + +class UpSample(nn.Module): + """ + + ### Up-sample + + The up-sample operation scales the image up by $2 \times$ and [smoothens](#smooth) each feature channel. + This is based on the paper + [Making Convolutional Networks Shift-Invariant Again](https://arxiv.org/abs/1904.11486). + """ + + def __init__(self): + super().__init__() + # Up-sampling layer + self.up_sample = nn.Upsample(scale_factor=2, mode='bilinear', align_corners=False) + # Smoothing layer + self.smooth = Smooth() + + def forward(self, x: torch.Tensor): + # Up-sample and smoothen + return self.smooth(self.up_sample(x)) + + +class Smooth(nn.Module): + """ + + ### Smoothing Layer + + This layer blurs each channel + """ + + def __init__(self): + super().__init__() + # Blurring kernel + kernel = [[1, 2, 1], + [2, 4, 2], + [1, 2, 1]] + # Convert the kernel to a PyTorch tensor + kernel = torch.tensor([[kernel]], dtype=torch.float) + # Normalize the kernel + kernel /= kernel.sum() + # Save kernel as a fixed parameter (no gradient updates) + self.kernel = nn.Parameter(kernel, requires_grad=False) + # Padding layer + self.pad = nn.ReplicationPad2d(1) + + def forward(self, x: torch.Tensor): + # Get shape of the input feature map + b, c, h, w = x.shape + # Reshape for smoothening + x = x.view(-1, 1, h, w) + + # Add padding + x = self.pad(x) + + # Smoothen (blur) with the kernel + x = F.conv2d(x, self.kernel) + + # Reshape and return + return x.view(b, c, h, w) + + +class EqualizedLinear(nn.Module): + """ + + ## Learning-rate Equalized Linear Layer + + This uses [learning-rate equalized weights]($equalized_weights) for a linear layer. 
+    """
+
+    def __init__(self, in_features: int, out_features: int, bias: float = 0.):
+        """
+        * `in_features` is the number of features in the input feature map
+        * `out_features` is the number of features in the output feature map
+        * `bias` is the bias initialization constant
+        """
+
+        super().__init__()
+        # [Learning-rate equalized weights](#equalized_weight)
+        self.weight = EqualizedWeight([out_features, in_features])
+        # Bias
+        self.bias = nn.Parameter(torch.ones(out_features) * bias)
+
+    def forward(self, x: torch.Tensor):
+        # Linear transformation
+        return F.linear(x, self.weight(), bias=self.bias)
+
+
+class EqualizedConv2d(nn.Module):
+    """
+
+    ## Learning-rate Equalized 2D Convolution Layer
+
+    This uses [learning-rate equalized weights](#equalized_weight) for a convolution layer.
+    """
+
+    def __init__(self, in_features: int, out_features: int,
+                 kernel_size: int, padding: int = 0):
+        """
+        * `in_features` is the number of features in the input feature map
+        * `out_features` is the number of features in the output feature map
+        * `kernel_size` is the size of the convolution kernel
+        * `padding` is the padding to be added on both sides of each spatial dimension
+        """
+        super().__init__()
+        # Padding size
+        self.padding = padding
+        # [Learning-rate equalized weights](#equalized_weight)
+        self.weight = EqualizedWeight([out_features, in_features, kernel_size, kernel_size])
+        # Bias
+        self.bias = nn.Parameter(torch.ones(out_features))
+
+    def forward(self, x: torch.Tensor):
+        # Convolution
+        return F.conv2d(x, self.weight(), bias=self.bias, padding=self.padding)
+
+
+class EqualizedWeight(nn.Module):
+    """
+
+    ## Learning-rate Equalized Weights Parameter
+
+    This is based on equalized learning rate introduced in the Progressive GAN paper.
+    Instead of initializing weights at $\mathcal{N}(0,c)$ they initialize weights
+    to $\mathcal{N}(0, 1)$ and then multiply them by $c$ when using them.
+    $$w_i = c \hat{w}_i$$
+
+    The gradients on the stored parameters $\hat{w}$ get multiplied by $c$, but this doesn't have
+    an effect since optimizers such as Adam normalize them by a running mean of the squared gradients.
+
+    The optimizer updates on $\hat{w}$ are proportionate to the learning rate $\lambda$.
+    But the effective weights $w$ get updated proportionately to $c \lambda$.
+    Without equalized learning rate, the effective weights would get updated proportionately to just $\lambda$.
+
+    So we are effectively scaling the learning rate by $c$ for these weight parameters.
+    """
+
+    def __init__(self, shape: List[int]):
+        """
+        * `shape` is the shape of the weight parameter
+        """
+        super().__init__()
+
+        # He initialization constant
+        self.c = 1 / math.sqrt(np.prod(shape[1:]))
+        # Initialize the weights with $\mathcal{N}(0, 1)$
+        self.weight = nn.Parameter(torch.randn(shape))
+
+    def forward(self):
+        # Multiply the weights by $c$ and return
+        return self.weight * self.c
+
+
+class GradientPenalty(nn.Module):
+    """
+
+    ## Gradient Penalty
+
+    This is the $R_1$ regularization penalty from the paper
+    [Which Training Methods for GANs do actually Converge?](https://arxiv.org/abs/1801.04406).
+
+    $$R_1(\psi) = \frac{\gamma}{2} \mathbb{E}_{p_\mathcal{D}(x)}
+    \Big[\Vert \nabla_x D_\psi(x) \Vert^2\Big]$$
+
+    That is, we try to reduce the squared L2 norm of the gradients of the discriminator with
+    respect to images, for real images ($x \sim p_\mathcal{D}$).
+    """
+
+    def forward(self, x: torch.Tensor, d: torch.Tensor):
+        """
+        * `x` is $x \sim p_\mathcal{D}$
+        * `d` is $D(x)$
+        """
+
+        # Get batch size
+        batch_size = x.shape[0]
+
+        # Calculate gradients of $D(x)$ with respect to $x$.
+        # `grad_outputs` is set to $1$ since we want the gradients of $D(x)$,
+        # and we need to create and retain the graph since we have to compute gradients
+        # with respect to the weights on this loss.
+        gradients, *_ = torch.autograd.grad(outputs=d,
+                                            inputs=x,
+                                            grad_outputs=d.new_ones(d.shape),
+                                            create_graph=True)
+
+        # Reshape gradients to calculate the norm
+        gradients = gradients.reshape(batch_size, -1)
+        # Calculate the norm $\Vert \nabla_{x} D(x) \Vert_2$
+        norm = gradients.norm(2, dim=-1)
+        # Return the loss $\Vert \nabla_x D_\psi(x) \Vert^2$
+        return torch.mean(norm ** 2)
+
+
+class PathLengthPenalty(nn.Module):
+    """
+
+    ## Path Length Penalty
+
+    This regularization encourages a fixed-size step in $w$ to result in a fixed-magnitude
+    change in the image.
+
+    $$\mathbb{E}_{w \sim f(z), y \sim \mathcal{N}(0, \mathbf{I})}
+      \Big(\Vert \mathbf{J}^\top_{w} y \Vert_2 - a \Big)^2$$
+
+    where $\mathbf{J}_w$ is the Jacobian
+    $\mathbf{J}_w = \frac{\partial g}{\partial w}$,
+    $w$ is sampled from the mapping network ($w \in \mathcal{W}$), and
+    $y$ are images with noise $\mathcal{N}(0, \mathbf{I})$.
+
+    $a$ is the exponential moving average of $\Vert \mathbf{J}^\top_{w} y \Vert_2$
+    as the training progresses.
+
+    $\mathbf{J}^\top_{w} y$ is calculated without explicitly calculating the Jacobian using
+    $$\mathbf{J}^\top_{w} y = \nabla_w \big(g(w) \cdot y \big)$$
+    """
+
+    def __init__(self, beta: float):
+        """
+        * `beta` is the constant $\beta$ used to calculate the exponential moving average $a$
+        """
+        super().__init__()
+
+        # $\beta$
+        self.beta = beta
+        # Number of steps calculated $N$
+        self.steps = nn.Parameter(torch.tensor(0.), requires_grad=False)
+        # Exponential sum of $\mathbf{J}^\top_{w} y$
+        # $$\sum^N_{i=1} \beta^{(N - i)}[\mathbf{J}^\top_{w} y]_i$$
+        # where $[\mathbf{J}^\top_{w} y]_i$ is the value of it at the $i$-th step of training
+        self.exp_sum_a = nn.Parameter(torch.tensor(0.), requires_grad=False)
+
+    def forward(self, w: torch.Tensor, x: torch.Tensor):
+        """
+        * `w` is the batch of $w$ of shape `[batch_size, d_latent]`
+        * `x` are the generated images of shape `[batch_size, 3, height, width]`
+        """
+
+        # Get the device
+        device = x.device
+        # Get number of pixels
+        image_size = x.shape[2] * x.shape[3]
+        # Calculate $y \sim \mathcal{N}(0, \mathbf{I})$
+        y = torch.randn(x.shape, device=device)
+        # Calculate $\big(g(w) \cdot y \big)$ and normalize by the square root of image size.
+        # This scaling is not mentioned in the paper but was present in
+        # [their implementation](https://github.com/NVlabs/stylegan2/blob/master/training/loss.py#L167).
+ output = (x * y).sum() / math.sqrt(image_size) + + # Calculate gradients to get $\mathbf{J}^\top_{w} y$ + gradients, *_ = torch.autograd.grad(outputs=output, + inputs=w, + grad_outputs=torch.ones(output.shape, device=device), + create_graph=True) + + # Calculate L2-norm of $\mathbf{J}^\top_{w} y$ + norm = (gradients ** 2).sum(dim=2).mean(dim=1).sqrt() + + # Regularize after first step + if self.steps > 0: + # Calculate $a$ + # $$\frac{1}{1 - \beta^N} \sum^N_{i=1} \beta^{(N - i)}[\mathbf{J}^\top_{w} y]_i$$ + a = self.exp_sum_a / (1 - self.beta ** self.steps) + # Calculate the penalty + # $$\mathbb{E}_{w \sim f(z), y \sim \mathcal{N}(0, \mathbf{I})} + # \Big(\Vert \mathbf{J}^\top_{w} y \Vert_2 - a \Big)^2$$ + loss = torch.mean((norm - a) ** 2) + else: + # Return a dummy loss if we can't calculate $a$ + loss = norm.new_tensor(0) + + # Calculate the mean of $\Vert \mathbf{J}^\top_{w} y \Vert_2$ + mean = norm.mean().detach() + # Update exponential sum + self.exp_sum_a.mul_(self.beta).add_(mean, alpha=1 - self.beta) + # Increment $N$ + self.steps.add_(1.) + + # Return the penalty + return loss diff --git a/labml_nn/gan/stylegan/experiment.py b/labml_nn/gan/stylegan/experiment.py new file mode 100644 index 00000000..4eec2d8a --- /dev/null +++ b/labml_nn/gan/stylegan/experiment.py @@ -0,0 +1,467 @@ +""" +--- +title: Style GAN 2 Model Training +summary: > + An annotated PyTorch implementation of StyleGAN2 model training code. +--- + +# [Style GAN 2](index.html) Model Training + +This is the training code for [Style GAN 2](index.html) model. + +![Generated Images](generated_64.png) + +*These are $64 \times 64$ images generated after training for about 80K steps.* + +*Our implementation is a minimalistic Style GAN2 model training code. +Only single GPU training is supported to keep the implementation simple. +We managed to shrink it to keep it at less than 500 lines of code, including the training loop.* + +*Without DDP (distributed data parallel) and multi-gpu training it will not be possible to train the model +for large resolutions (128+). +If you want training code with fp16 and DDP take a look at +[lucidrains/stylegan2-pytorch](https://github.com/lucidrains/stylegan2-pytorch).* + +We trained this on [CelebA-HQ dataset](https://github.com/tkarras/progressive_growing_of_gans). +You can find the download instruction in this +[discussion on fast.ai](https://forums.fast.ai/t/download-celeba-hq-dataset/45873/3). +Save the images inside [`data/stylegan` folder](#dataset_path). +""" + +import math +from pathlib import Path +from typing import Iterator, Tuple + +import torch +import torch.utils.data +import torchvision +from PIL import Image + +from labml import tracker, lab, monit, experiment +from labml.configs import BaseConfigs +from labml_helpers.device import DeviceConfigs +from labml_helpers.train_valid import ModeState, hook_model_outputs +from labml_nn.gan.stylegan import Discriminator, Generator, MappingNetwork, GradientPenalty, PathLengthPenalty +from labml_nn.gan.wasserstein import DiscriminatorLoss, GeneratorLoss +from labml_nn.utils import cycle_dataloader + + +class Dataset(torch.utils.data.Dataset): + """ + ## Dataset + + This loads the training dataset and resize it to the give image size. 
+ """ + + def __init__(self, path: str, image_size: int): + """ + * `path` path to the folder containing the images + * `image_size` size of the image + """ + super().__init__() + + # Get the paths of all `jpg` files + self.paths = [p for p in Path(path).glob(f'**/*.jpg')] + + # Transformation + self.transform = torchvision.transforms.Compose([ + # Resize the image + torchvision.transforms.Resize(image_size), + # Convert to PyTorch tensor + torchvision.transforms.ToTensor(), + ]) + + def __len__(self): + """Number of images""" + return len(self.paths) + + def __getitem__(self, index): + """Get the the `index`-th image""" + path = self.paths[index] + img = Image.open(path) + return self.transform(img) + + +class Configs(BaseConfigs): + """ + ## Configurations + """ + + # Device to train the model on. + # [`DeviceConfigs`](https://github.com/lab-ml/helpers/blob/master/labml_helpers/device.py) + # picks up an available CUDA device or defaults to CPU. + device: torch.device = DeviceConfigs() + + # [StyleGAN2 Discriminator](index.html#discriminator) + discriminator: Discriminator + # [StyleGAN2 Generator](index.html#generator) + generator: Generator + # [Mapping network](index.html#mapping_network) + mapping_network: MappingNetwork + + # Discriminator and generator loss functions. + # We use [Wasserstein loss](../wasserstein/index.html) + discriminator_loss: DiscriminatorLoss + generator_loss: GeneratorLoss + + # Optimizers + generator_optimizer: torch.optim.Adam + discriminator_optimizer: torch.optim.Adam + mapping_network_optimizer: torch.optim.Adam + + # [Gradient Penalty Regularization Loss](index.html#gradient_penalty) + gradient_penalty = GradientPenalty() + # Gradient penalty coefficient $\gamma$ + gradient_penalty_coefficient: float = 10. + + # [Path length penalty](index.html#path_length_penalty) + path_length_penalty: PathLengthPenalty + + # Data loader + loader: Iterator + + # Batch size + batch_size: int = 32 + # Dimensionality of $z$ and $w$ + d_latent: int = 512 + # Height/width of the image + image_size: int = 32 + # Number of layers in the mapping network + mapping_network_layers: int = 8 + # Generator & Discriminator learning rate + learning_rate: float = 1e-3 + # Mapping network learning rate ($100 \times$ lower than the others) + mapping_network_learning_rate: float = 1e-5 + # Number of steps to accumulate gradients on. Use this to increase the effective batch size. + gradient_accumulate_steps: int = 1 + # $\beta_1$ and $\beta_2$ for Adam optimizer + adam_betas: Tuple[float, float] = (0.0, 0.99) + # Probability of mixing styles + style_mixing_prob: float = 0.9 + + # Total number of training steps + training_steps: int = 150_000 + + # Number of blocks in the generator (calculated based on image resolution) + n_gen_blocks: int + + # ### Lazy regularization + # Instead of calculating the regularization losses, the paper proposes lazy regularization + # where the regularization terms are calculated once in a while. + # This improves the training efficiency a lot. 
+ + # The interval at which to compute gradient penalty + lazy_gradient_penalty_interval: int = 4 + # Path length penalty calculation interval + lazy_path_penalty_interval: int = 32 + # Skip calculating path length penalty during the initial phase of training + lazy_path_penalty_after: int = 5_000 + + # How often to log generated images + log_generated_interval: int = 500 + # How often to save model checkpoints + save_checkpoint_interval: int = 2_000 + + # Training mode state for logging activations + mode: ModeState + # Whether to log model layer outputs + log_layer_outputs: bool = False + + # + # We trained this on [CelebA-HQ dataset](https://github.com/tkarras/progressive_growing_of_gans). + # You can find the download instruction in this + # [discussion on fast.ai](https://forums.fast.ai/t/download-celeba-hq-dataset/45873/3). + # Save the images inside `data/stylegan` folder. + dataset_path: str = str(lab.get_data_path() / 'stylegan2') + + def init(self): + """ + ### Initialize + """ + # Create dataset + dataset = Dataset(self.dataset_path, self.image_size) + # Create data loader + dataloader = torch.utils.data.DataLoader(dataset, batch_size=self.batch_size, num_workers=32, + shuffle=True, drop_last=True, pin_memory=True) + # Continuous [cyclic loader](../../utils.html#cycle_dataloader) + self.loader = cycle_dataloader(dataloader) + + # $\log_2$ of image resolution + log_resolution = int(math.log2(self.image_size)) + + # Create discriminator and generator + self.discriminator = Discriminator(log_resolution).to(self.device) + self.generator = Generator(log_resolution, self.d_latent).to(self.device) + # Get number of generator blocks for creating style and noise inputs + self.n_gen_blocks = self.generator.n_blocks + # Create mapping network + self.mapping_network = MappingNetwork(self.d_latent, self.mapping_network_layers).to(self.device) + # Create path length penalty loss + self.path_length_penalty = PathLengthPenalty(0.99).to(self.device) + + # Add model hooks to monitor layer outputs + if self.log_layer_outputs: + hook_model_outputs(self.mode, self.discriminator, 'discriminator') + hook_model_outputs(self.mode, self.generator, 'generator') + hook_model_outputs(self.mode, self.mapping_network, 'mapping_network') + + # Discriminator and generator losses + self.discriminator_loss = DiscriminatorLoss().to(self.device) + self.generator_loss = GeneratorLoss().to(self.device) + + # Create optimizers + self.discriminator_optimizer = torch.optim.Adam( + self.discriminator.parameters(), + lr=self.learning_rate, betas=self.adam_betas + ) + self.generator_optimizer = torch.optim.Adam( + self.generator.parameters(), + lr=self.learning_rate, betas=self.adam_betas + ) + self.mapping_network_optimizer = torch.optim.Adam( + self.mapping_network.parameters(), + lr=self.mapping_network_learning_rate, betas=self.adam_betas + ) + + # Set tracker configurations + tracker.set_image("generated", True) + + def get_w(self, batch_size: int): + """ + ### Sample $w$ + + This samples $z$ randomly and get $w$ from the mapping network. + + We also apply style mixing sometimes where we generate two latent variables + $z_1$ and $z_2$ and get corresponding $w_1$ and $w_2$. + Then we randomly sample a cross-over point and apply $w_1$ to + the generator blocks before the cross-over point and + $w_2$ to the blocks after. 
+        """
+
+        # Mix styles
+        if torch.rand(()).item() < self.style_mixing_prob:
+            # Random cross-over point
+            cross_over_point = int(torch.rand(()).item() * self.n_gen_blocks)
+            # Sample $z_1$ and $z_2$
+            z2 = torch.randn(batch_size, self.d_latent).to(self.device)
+            z1 = torch.randn(batch_size, self.d_latent).to(self.device)
+            # Get $w_1$ and $w_2$
+            w1 = self.mapping_network(z1)
+            w2 = self.mapping_network(z2)
+            # Expand $w_1$ and $w_2$ for the generator blocks and concatenate
+            w1 = w1[None, :, :].expand(cross_over_point, -1, -1)
+            w2 = w2[None, :, :].expand(self.n_gen_blocks - cross_over_point, -1, -1)
+            return torch.cat((w1, w2), dim=0)
+        # Without mixing
+        else:
+            # Sample $z$
+            z = torch.randn(batch_size, self.d_latent).to(self.device)
+            # Get $w$
+            w = self.mapping_network(z)
+            # Expand $w$ for the generator blocks
+            return w[None, :, :].expand(self.n_gen_blocks, -1, -1)
+
+    def get_noise(self, batch_size: int):
+        """
+        ### Generate noise
+
+        This generates noise for each [generator block](index.html#generator_block)
+        """
+        # List to store noise
+        noise = []
+        # Noise resolution starts from $4$
+        resolution = 4
+
+        # Generate noise for each generator block
+        for i in range(self.n_gen_blocks):
+            # The first block has only one $3 \times 3$ convolution
+            if i == 0:
+                n1 = None
+            # Generate noise to add after the first convolution layer
+            else:
+                n1 = torch.randn(batch_size, 1, resolution, resolution, device=self.device)
+            # Generate noise to add after the second convolution layer
+            n2 = torch.randn(batch_size, 1, resolution, resolution, device=self.device)
+
+            # Add noise tensors to the list
+            noise.append((n1, n2))
+
+            # Next block has $2 \times$ resolution
+            resolution *= 2
+
+        # Return noise tensors
+        return noise
+
+    def generate_images(self, batch_size: int):
+        """
+        ### Generate images
+
+        This generates images using the generator.
+        """
+
+        # Get $w$
+        w = self.get_w(batch_size)
+        # Get noise
+        noise = self.get_noise(batch_size)
+
+        # Generate images
+        images = self.generator(w, noise)
+
+        # Return images and $w$
+        return images, w
+
+    def step(self, idx: int):
+        """
+        ### Training Step
+        """
+
+        # Train the discriminator
+        with monit.section('Discriminator'):
+            # Reset gradients
+            self.discriminator_optimizer.zero_grad()
+
+            # Accumulate gradients for `gradient_accumulate_steps`
+            for i in range(self.gradient_accumulate_steps):
+                # Update `mode`. Set whether to log activations
+                with self.mode.update(is_log_activations=(idx + 1) % self.log_generated_interval == 0):
+                    # Sample images from generator
+                    generated_images, _ = self.generate_images(self.batch_size)
+                    # Discriminator classification for generated images
+                    fake_output = self.discriminator(generated_images.detach())
+
+                    # Get real images from the data loader
+                    real_images = next(self.loader).to(self.device)
+                    # We need to calculate gradients w.r.t.
real images for gradient penalty + if (idx + 1) % self.lazy_gradient_penalty_interval == 0: + real_images.requires_grad_() + # Discriminator classification for real images + real_output = self.discriminator(real_images) + + # Get discriminator loss + real_loss, fake_loss = self.discriminator_loss(real_output, fake_output) + disc_loss = real_loss + fake_loss + + # Add gradient penalty + if (idx + 1) % self.lazy_gradient_penalty_interval == 0: + # Calculate and log gradient penalty + gp = self.gradient_penalty(real_images, real_output) + tracker.add('loss.gp', gp) + # Multiply by coefficient and add gradient penalty + disc_loss = disc_loss + 0.5 * self.gradient_penalty_coefficient * gp * self.lazy_gradient_penalty_interval + + # Compute gradients + disc_loss.backward() + + # Log discriminator loss + tracker.add('loss.discriminator', disc_loss) + + if (idx + 1) % self.log_generated_interval == 0: + # Log discriminator model parameters occasionally + tracker.add('discriminator', self.discriminator) + + # Clip gradients for stabilization + torch.nn.utils.clip_grad_norm_(self.discriminator.parameters(), max_norm=1.0) + # Take optimizer step + self.discriminator_optimizer.step() + + # Train the generator + with monit.section('Generator'): + # Reset gradients + self.generator_optimizer.zero_grad() + self.mapping_network_optimizer.zero_grad() + + # Accumulate gradients for `gradient_accumulate_steps` + for i in range(self.gradient_accumulate_steps): + # Sample images from generator + generated_images, w = self.generate_images(self.batch_size) + # Discriminator classification for generated images + fake_output = self.discriminator(generated_images) + + # Get generator loss + gen_loss = self.generator_loss(fake_output) + + # Add path length penalty + if idx > self.lazy_path_penalty_after and (idx + 1) % self.lazy_path_penalty_interval == 0: + # Calculate path length penalty + plp = self.path_length_penalty(w, generated_images) + # Ignore if `nan` + if not torch.isnan(plp): + tracker.add('loss.plp', plp) + gen_loss = gen_loss + plp + + # Calculate gradients + gen_loss.backward() + + # Log generator loss + tracker.add('loss.generator', gen_loss) + + if (idx + 1) % self.log_generated_interval == 0: + # Log discriminator model parameters occasionally + tracker.add('generator', self.generator) + tracker.add('mapping_network', self.mapping_network) + + # Clip gradients for stabilization + torch.nn.utils.clip_grad_norm_(self.generator.parameters(), max_norm=1.0) + torch.nn.utils.clip_grad_norm_(self.mapping_network.parameters(), max_norm=1.0) + + # Take optimizer step + self.generator_optimizer.step() + self.mapping_network_optimizer.step() + + # Log generated images + if (idx + 1) % self.log_generated_interval == 0: + tracker.add('generated', torch.cat([generated_images[:6], real_images[:3]], dim=0)) + # Save model checkpoints + if (idx + 1) % self.save_checkpoint_interval == 0: + experiment.save_checkpoint() + + # Flush tracker + tracker.save() + + def train(self): + """ + ## Train model + """ + + # Loop for `training_steps` + for i in monit.loop(self.training_steps): + # Take a training step + self.step(i) + # + if (i + 1) % self.log_generated_interval == 0: + tracker.new_line() + + +def main(): + """ + ### Train StyleGAN2 + """ + + # Create an experiment + experiment.create(name='stylegan2') + # Create configurations object + configs = Configs() + + # Set configurations and override some + experiment.configs(configs, { + 'device.cuda_device': 0, + 'image_size': 64, + 'log_generated_interval': 200 + }) + 
+ # Initialize + configs.init() + # Set models for saving and loading + experiment.add_pytorch_models(mapping_network=configs.mapping_network, + generator=configs.generator, + discriminator=configs.discriminator) + + # Start the experiment + with experiment.start(): + # Run the training loop + configs.train() + +# +if __name__ == '__main__': + main() diff --git a/labml_nn/utils.py b/labml_nn/utils.py index 1734c974..5267dc5e 100644 --- a/labml_nn/utils.py +++ b/labml_nn/utils.py @@ -14,6 +14,20 @@ from labml_helpers.module import M, TypedModuleList def clone_module_list(module: M, n: int) -> TypedModuleList[M]: """ - ## Make a `nn.ModuleList` with clones of a given layer + ## Clone Module + + Make a `nn.ModuleList` with clones of a given module """ return TypedModuleList([copy.deepcopy(module) for _ in range(n)]) + + +def cycle_dataloader(data_loader): + """ + + ## Cycle Data Loader + + Infinite loader that recycles the data loader after each epoch + """ + while True: + for batch in data_loader: + yield batch diff --git a/requirements.txt b/requirements.txt index 6fdc75b3..579efdb2 100644 --- a/requirements.txt +++ b/requirements.txt @@ -7,3 +7,4 @@ matplotlib>=3.0.3 einops>=0.3.0 gym[atari] opencv-python +Pillow>=6.2.1 diff --git a/utils/diagrams.py b/utils/diagrams.py new file mode 100644 index 00000000..07605158 --- /dev/null +++ b/utils/diagrams.py @@ -0,0 +1,260 @@ +import shutil +from pathlib import Path +from typing import List +from xml.dom import minidom + +from labml import monit + +HOME = Path('.').absolute() + +STYLES = """ +.black-stroke { + stroke: #aaa; +} + +rect.black-stroke { + stroke: #444; +} + +.black-fill { + fill: #ddd; +} + +.white-fill { + fill: #333; +} + +.blue-stroke { + stroke: #5b8fab; +} + +.blue-fill { + fill: #356782; +} + +.yellow-stroke { + stroke: #bbab52; +} + +.yellow-fill { + fill: #a7942b; +} + +.grey-stroke { + stroke: #484d5a; +} + +.grey-fill { + fill: #2e323c; +} + +.red-stroke { + stroke: #bb3232; +} + +.red-fill { + fill: #901c1c; +} + +.orange-stroke { + stroke: #a5753f; +} + +.orange-fill { + fill: #82531e; +} + +.purple-stroke { + stroke: #a556a5; +} + +.purple-fill { + fill: #8a308a; +} + +.green-stroke { + stroke: #80cc92; +} + +.green-fill { + fill: #499e5d; +} + +switch foreignObject div div div { + color: #ddd !important; +} + +switch foreignObject div div div span { + color: #ddd !important; +} + +.has-background { + background-color: #1d2127 !important; +} +""" + +STROKES = { + '#000000': 'black', + '#6c8ebf': 'blue', + '#d6b656': 'yellow', + '#666666': 'grey', + '#b85450': 'red', + '#d79b00': 'orange', + '#9673a6': 'purple', + '#82b366': 'green', +} + +FILLS = { + '#000000': 'black', + '#ffffff': 'white', + '#dae8fc': 'blue', + '#fff2cc': 'yellow', + '#f5f5f5': 'grey', + '#f8cecc': 'red', + '#ffe6cc': 'orange', + '#e1d5e7': 'purple', + '#d5e8d4': 'green', +} + + +def clear_switches(doc: minidom.Document): + switches = doc.getElementsByTagName('switch') + for s in switches: + children = s.childNodes + assert len(children) == 2 + if children[0].tagName == 'g' and 'requiredFeatures' in children[0].attributes: + s.parentNode.removeChild(s) + s.unlink() + continue + assert children[0].tagName == 'foreignObject' + assert children[1].tagName == 'text' + c = children[1] + s.removeChild(c) + s.parentNode.insertBefore(c, s) + s.parentNode.removeChild(s) + + +def add_class(node: minidom.Node, class_name: str): + if 'class' not in node.attributes: + node.attributes['class'] = class_name + return + + node.attributes['class'] = 
node.attributes['class'].value + f' {class_name}' + + +def add_bg_classes(nodes: List[minidom.Node]): + for node in nodes: + if 'style' in node.attributes: + s = node.attributes['style'].value + if s.count('background-color'): + add_class(node, 'has-background') + + +def add_stroke_classes(nodes: List[minidom.Node]): + for node in nodes: + if 'stroke' in node.attributes: + stroke = node.attributes['stroke'].value + if stroke not in STROKES: + continue + + node.removeAttribute('stroke') + add_class(node, f'{STROKES[stroke]}-stroke') + + +def add_fill_classes(nodes: List[minidom.Node]): + for node in nodes: + if 'fill' in node.attributes: + fill = node.attributes['fill'].value + if fill not in FILLS: + continue + + node.removeAttribute('fill') + add_class(node, f'{FILLS[fill]}-fill') + + +def add_classes(doc: minidom.Document): + paths = doc.getElementsByTagName('path') + add_stroke_classes(paths) + add_fill_classes(paths) + + rects = doc.getElementsByTagName('rect') + add_stroke_classes(rects) + add_fill_classes(rects) + + ellipse = doc.getElementsByTagName('ellipse') + add_stroke_classes(ellipse) + add_fill_classes(ellipse) + + text = doc.getElementsByTagName('text') + add_fill_classes(text) + + div = doc.getElementsByTagName('div') + add_bg_classes(div) + + span = doc.getElementsByTagName('span') + add_bg_classes(span) + + +def parse(source: Path, dest: Path): + doc: minidom.Document = minidom.parse(str(source)) + + svg = doc.getElementsByTagName('svg') + + assert len(svg) == 1 + svg = svg[0] + + if 'content' in svg.attributes: + svg.removeAttribute('content') + # svg.attributes['height'] = str(int(svg.attributes['height'].value[:-2]) + 30) + 'px' + # svg.attributes['width'] = str(int(svg.attributes['width'].value[:-2]) + 30) + 'px' + + view_box = svg.attributes['viewBox'].value.split(' ') + view_box = [float(v) for v in view_box] + view_box[0] -= 10 + view_box[1] -= 10 + view_box[2] += 20 + view_box[3] += 20 + svg.attributes['viewBox'] = ' '.join([str(v) for v in view_box]) + + svg.attributes['style'] = 'background: #1d2127;' # padding: 10px;' + + # clear_switches(doc) + + style = doc.createElement('style') + style.appendChild(doc.createTextNode(STYLES)) + svg.insertBefore(style, svg.childNodes[0]) + add_classes(doc) + + with open(str(dest), 'w') as f: + doc.writexml(f) + + +def recurse(path: Path): + files = [] + if path.is_file(): + files.append(path) + return files + + for f in path.iterdir(): + files += recurse(f) + + return files + + +def main(): + diagrams_path = HOME / 'diagrams' + docs_path = HOME / 'docs' + + for p in recurse(diagrams_path): + source_path = p + p = p.relative_to(diagrams_path) + dest_path = docs_path / p + if not dest_path.parent.exists(): + dest_path.parent.mkdir(parents=True) + + with monit.section(str(p)): + shutil.copy(str(source_path), str(dest_path)) + + +if __name__ == '__main__': + main()