|
fb2ecb6637
|
capsule net descriptions
|
2021-01-16 20:58:25 +05:30 |
|
|
642c944e1b
|
Update setup.py
|
2021-01-15 11:45:25 +05:30 |
|
|
ec45cd9437
|
typo
|
2021-01-14 10:22:01 +05:30 |
|
|
a94ed927aa
|
gpt links
|
2021-01-14 10:20:21 +05:30 |
|
|
2cf6e7a079
|
colab notebook
|
2021-01-14 10:18:27 +05:30 |
|
|
e367505720
|
feedback experiment fix
|
2021-01-14 10:02:18 +05:30 |
|
|
55ec434132
|
gpt notes
|
2021-01-14 09:38:16 +05:30 |
|
|
2927aa217b
|
gpt notes
|
2021-01-14 09:37:12 +05:30 |
|
|
4c769128cb
|
autoregression trainer notes
|
2021-01-14 08:46:41 +05:30 |
|
|
fbb1026164
|
weight decouple fix
|
2021-01-13 20:33:25 +05:30 |
|
|
774a72e0bf
|
gpt
|
2021-01-13 12:54:43 +05:30 |
|
|
a11e3efff2
|
Update readme.md
|
2021-01-13 08:37:04 +05:30 |
|
|
193a471217
|
Update readme.md
|
2021-01-13 08:36:40 +05:30 |
|
|
0bc13a92ce
|
Update readme.md
|
2021-01-13 08:35:22 +05:30 |
|
|
fff2034fa2
|
Update readme.md
|
2021-01-10 18:08:50 +05:30 |
|
|
0de6605c80
|
experiment notebook
|
2021-01-10 12:19:18 +05:30 |
|
|
9102883e1f
|
transpose with \top
|
2021-01-10 12:16:50 +05:30 |
|
|
8ee70da198
|
feedback link
|
2021-01-10 11:52:08 +05:30 |
|
|
3ede1c3460
|
fix
|
2021-01-10 11:34:28 +05:30 |
|
|
1dc4ff825f
|
feedback transformer notes
|
2021-01-10 10:22:46 +05:30 |
|
|
5874106161
|
feedback transformer notes
|
2021-01-09 21:06:41 +05:30 |
|
|
fa5805f275
|
relative mha
|
2021-01-09 10:52:49 +05:30 |
|
|
809a54d6aa
|
relative attention notes
|
2021-01-09 10:41:25 +05:30 |
|
|
9f4b494bf2
|
feedback transformer
|
2021-01-09 07:28:25 +05:30 |
|
|
ce190701e8
|
global step
|
2021-01-07 21:11:50 +05:30 |
|
|
c124348b14
|
gradient clipping
|
2021-01-07 13:33:32 +05:30 |
|
|
dfefde657b
|
no loss smoothing
|
2021-01-07 12:02:19 +05:30 |
|
|
b9da12ee3f
|
d_model
|
2021-01-06 17:24:09 +05:30 |
|
|
605ad0fdde
|
minor improvements
|
2021-01-03 14:39:01 +05:30 |
|
|
4cb730d579
|
fix
|
2021-01-03 14:33:16 +05:30 |
|
|
a962cc320e
|
fix
|
2021-01-03 14:28:07 +05:30 |
|
|
724ff555b3
|
Merge branch 'master' of github.com:lab-ml/labml_nn
merge
|
2021-01-03 14:20:28 +05:30 |
|
|
9907e03742
|
typo fix
|
2021-01-03 14:19:52 +05:30 |
|
|
4557175314
|
Update hyper_lstm.py
|
2021-01-03 14:19:41 +05:30 |
|
|
6fe86efdff
|
badge
|
2021-01-03 12:16:01 +05:30 |
|
|
927acc2d81
|
hypernetworks link
|
2021-01-03 11:22:02 +05:30 |
|
|
979b01adc2
|
update experiment
|
2021-01-03 11:20:30 +05:30 |
|
|
bead174ed4
|
notebook
|
2021-01-03 11:12:55 +05:30 |
|
|
600c8590f4
|
hyperlstm notes
|
2021-01-03 11:07:12 +05:30 |
|
|
7d3c6fcd41
|
lstm chunk
|
2020-12-28 16:14:12 +05:30 |
|
|
814fd565c0
|
hyper lstm experiment
|
2020-12-28 16:02:47 +05:30 |
|
|
52d5b5fbf6
|
auto regression common exp
|
2020-12-27 07:35:35 +05:30 |
|
|
4fe8392a8d
|
auto regression common exp
|
2020-12-27 07:30:20 +05:30 |
|
|
c64b98e390
|
basic auto regression experiment for reuse
|
2020-12-26 21:12:44 +05:30 |
|
|
a6502de621
|
shuffle data
|
2020-12-26 20:46:58 +05:30 |
|
|
716dda5f3b
|
fix lr
|
2020-12-26 16:44:11 +05:30 |
|
|
48277e9334
|
hyperlstm
|
2020-12-26 15:49:44 +05:30 |
|
|
3e798f38f9
|
Update readme.md
|
2020-12-23 16:11:22 +05:30 |
|
|
b05faa9b98
|
default warm up
|
2020-12-23 13:57:34 +05:30 |
|
|
634809af3c
|
noam chart fix
|
2020-12-23 13:52:08 +05:30 |
|