LoRA notes

This commit is contained in:
Varuna Jayasiri
2024-08-03 16:59:15 +05:30
parent eb9337e949
commit d4af40b595
9 changed files with 1236 additions and 28 deletions

View File

@ -12,7 +12,7 @@
<meta name="twitter:site" content="@labmlai"/>
<meta name="twitter:creator" content="@labmlai"/>
<meta property="og:url" content="https://nn.labml.ai/RWKV/configs.html"/>
<meta property="og:url" content="https://nn.labml.ai/rwkv/configs.html"/>
<meta property="og:title" content="configs.py"/>
<meta property="og:image" content="https://avatars1.githubusercontent.com/u/64068543?s=400&amp;v=4"/>
<meta property="og:site_name" content="configs.py"/>
@ -23,7 +23,7 @@
<title>configs.py</title>
<link rel="shortcut icon" href="/icon.png"/>
<link rel="stylesheet" href="../pylit.css?v=1">
<link rel="canonical" href="https://nn.labml.ai/RWKV/configs.html"/>
<link rel="canonical" href="https://nn.labml.ai/rwkv/configs.html"/>
<link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/katex@0.13.18/dist/katex.min.css" integrity="sha384-zTROYFVGOfTw7JV7KUu8udsvW2fx4lWOsCEDqhBreBwlHI4ioVRtmIvEThzJHGET" crossorigin="anonymous">
<!-- Global site tag (gtag.js) - Google Analytics -->
@ -47,7 +47,7 @@
<div class='docs'>
<p>
<a class="parent" href="/">home</a>
<a class="parent" href="index.html">RWKV</a>
<a class="parent" href="index.html">rwkv</a>
</p>
<p>
<a href="https://github.com/labmlai/annotated_deep_learning_paper_implementations" target="_blank">
@ -60,7 +60,7 @@
style="max-width:100%;"/></a>
</p>
<p>
<a href="https://github.com/labmlai/annotated_deep_learning_paper_implementations/tree/master/labml_nn/RWKV/configs.py" target="_blank">
<a href="https://github.com/labmlai/annotated_deep_learning_paper_implementations/tree/master/labml_nn/rwkv/configs.py" target="_blank">
View code on Github</a>
</p>
</div>

View File

@ -12,7 +12,7 @@
<meta name="twitter:site" content="@labmlai"/>
<meta name="twitter:creator" content="@labmlai"/>
<meta property="og:url" content="https://nn.labml.ai/RWKV/experiment.html"/>
<meta property="og:url" content="https://nn.labml.ai/rwkv/experiment.html"/>
<meta property="og:title" content="experiment.py"/>
<meta property="og:image" content="https://avatars1.githubusercontent.com/u/64068543?s=400&amp;v=4"/>
<meta property="og:site_name" content="experiment.py"/>
@ -23,7 +23,7 @@
<title>experiment.py</title>
<link rel="shortcut icon" href="/icon.png"/>
<link rel="stylesheet" href="../pylit.css?v=1">
<link rel="canonical" href="https://nn.labml.ai/RWKV/experiment.html"/>
<link rel="canonical" href="https://nn.labml.ai/rwkv/experiment.html"/>
<link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/katex@0.13.18/dist/katex.min.css" integrity="sha384-zTROYFVGOfTw7JV7KUu8udsvW2fx4lWOsCEDqhBreBwlHI4ioVRtmIvEThzJHGET" crossorigin="anonymous">
<!-- Global site tag (gtag.js) - Google Analytics -->
@ -47,7 +47,7 @@
<div class='docs'>
<p>
<a class="parent" href="/">home</a>
<a class="parent" href="index.html">RWKV</a>
<a class="parent" href="index.html">rwkv</a>
</p>
<p>
<a href="https://github.com/labmlai/annotated_deep_learning_paper_implementations" target="_blank">
@ -60,7 +60,7 @@
style="max-width:100%;"/></a>
</p>
<p>
<a href="https://github.com/labmlai/annotated_deep_learning_paper_implementations/tree/master/labml_nn/RWKV/experiment.py" target="_blank">
<a href="https://github.com/labmlai/annotated_deep_learning_paper_implementations/tree/master/labml_nn/rwkv/experiment.py" target="_blank">
View code on Github</a>
</p>
</div>
@ -78,10 +78,10 @@
<span class="lineno">3</span>
<span class="lineno">4</span><span class="kn">import</span> <span class="nn">torch</span>
<span class="lineno">5</span><span class="kn">import</span> <span class="nn">torch.nn</span> <span class="k">as</span> <span class="nn">nn</span>
<span class="lineno">6</span><span class="kn">from</span> <span class="nn">labml_nn.RWKV.configs</span> <span class="kn">import</span> <span class="n">RWKVConfigs</span>
<span class="lineno">6</span><span class="kn">from</span> <span class="nn">labml_nn.rwkv.configs</span> <span class="kn">import</span> <span class="n">RWKVConfigs</span>
<span class="lineno">7</span>
<span class="lineno">8</span><span class="kn">from</span> <span class="nn">labml_nn.RWKV</span> <span class="kn">import</span> <span class="n">RWKV</span>
<span class="lineno">9</span><span class="kn">from</span> <span class="nn">labml_nn.RWKV</span> <span class="kn">import</span> <span class="n">TimeMixing</span>
<span class="lineno">8</span><span class="kn">from</span> <span class="nn">labml_nn.rwkv</span> <span class="kn">import</span> <span class="n">RWKV</span>
<span class="lineno">9</span><span class="kn">from</span> <span class="nn">labml_nn.rwkv</span> <span class="kn">import</span> <span class="n">TimeMixing</span>
<span class="lineno">10</span><span class="kn">from</span> <span class="nn">labml</span> <span class="kn">import</span> <span class="n">experiment</span>
<span class="lineno">11</span><span class="kn">from</span> <span class="nn">labml.configs</span> <span class="kn">import</span> <span class="n">option</span>
<span class="lineno">12</span><span class="kn">from</span> <span class="nn">labml_nn.experiments.nlp_autoregression</span> <span class="kn">import</span> <span class="n">NLPAutoRegressionConfigs</span></pre></div>

View File

@ -12,7 +12,7 @@
<meta name="twitter:site" content="@labmlai"/>
<meta name="twitter:creator" content="@labmlai"/>
<meta property="og:url" content="https://nn.labml.ai/RWKV/index.html"/>
<meta property="og:url" content="https://nn.labml.ai/rwkv/index.html"/>
<meta property="og:title" content="Receptance Weighted Key Value (RWKV)"/>
<meta property="og:image" content="https://avatars1.githubusercontent.com/u/64068543?s=400&amp;v=4"/>
<meta property="og:site_name" content="Receptance Weighted Key Value (RWKV)"/>
@ -23,7 +23,7 @@
<title>Receptance Weighted Key Value (RWKV)</title>
<link rel="shortcut icon" href="/icon.png"/>
<link rel="stylesheet" href="../pylit.css?v=1">
<link rel="canonical" href="https://nn.labml.ai/RWKV/index.html"/>
<link rel="canonical" href="https://nn.labml.ai/rwkv/index.html"/>
<link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/katex@0.13.18/dist/katex.min.css" integrity="sha384-zTROYFVGOfTw7JV7KUu8udsvW2fx4lWOsCEDqhBreBwlHI4ioVRtmIvEThzJHGET" crossorigin="anonymous">
<!-- Global site tag (gtag.js) - Google Analytics -->
@ -47,7 +47,7 @@
<div class='docs'>
<p>
<a class="parent" href="/">home</a>
<a class="parent" href="index.html">RWKV</a>
<a class="parent" href="index.html">rwkv</a>
</p>
<p>
<a href="https://github.com/labmlai/annotated_deep_learning_paper_implementations" target="_blank">
@ -60,7 +60,7 @@
style="max-width:100%;"/></a>
</p>
<p>
<a href="https://github.com/labmlai/annotated_deep_learning_paper_implementations/tree/master/labml_nn/RWKV/__init__.py" target="_blank">
<a href="https://github.com/labmlai/annotated_deep_learning_paper_implementations/tree/master/labml_nn/rwkv/__init__.py" target="_blank">
View code on Github</a>
</p>
</div>