|
092b8ddaf4
|
multiplication
|
2022-06-09 17:25:02 +05:30 |
|
|
0ce0aba12a
|
refractor
|
2022-06-09 15:24:13 +05:30 |
|
|
cd4e59840e
|
refractor
|
2022-06-09 15:20:08 +05:30 |
|
|
3582cc97cf
|
results
|
2022-06-08 14:45:24 +05:30 |
|
|
af233cfd73
|
copy multiple
|
2022-06-07 14:00:12 +05:30 |
|
|
680b8e5734
|
0/1
|
2022-06-05 16:32:31 +05:30 |
|
|
fa10e7a149
|
copy
|
2022-06-05 06:07:46 +05:30 |
|
|
d915314947
|
experiment
|
2022-06-03 20:45:18 +05:30 |
|
|
1a3482857d
|
arithmetic dataset notes
|
2022-06-03 17:08:22 +05:30 |
|
|
7b492eca71
|
with explanaitons only
|
2022-06-03 16:55:25 +05:30 |
|
|
104070806e
|
logs
|
2022-06-02 16:15:43 +05:30 |
|
|
e409e9bf98
|
arthmetic test score
|
2022-06-01 14:07:27 +05:30 |
|
|
c08af45b03
|
experiment
|
2022-05-31 22:39:58 +05:30 |
|
|
13686c1d28
|
arithmetic exp
|
2022-05-31 18:07:54 +05:30 |
|
|
367da28267
|
arithmetic dataset
|
2022-05-31 08:32:12 +05:30 |
|
|
aa311eb30d
|
experiemnt logs
|
2022-05-03 09:12:18 +01:00 |
|
|
a7a7a3bdb7
|
RETRO (#110)
|
2022-03-12 15:44:35 +05:30 |
|
|
6cd0ed168e
|
update torch
|
2021-10-29 09:05:59 +05:30 |
|
|
76ae56ff15
|
highlight code in notes
|
2021-10-22 18:34:59 +05:30 |
|
|
dc4da2106b
|
headings
|
2021-10-21 15:15:05 +05:30 |
|
|
c5b13162cf
|
anchors
|
2021-10-21 15:01:58 +05:30 |
|
|
d4b4c28840
|
typo fixes
|
2021-10-19 19:17:51 +05:30 |
|
|
6615c7158a
|
Primer EZ (#96)
|
2021-09-21 16:01:26 +05:30 |
|
|
02992a43ab
|
cleanup
|
2021-08-27 20:49:33 +05:30 |
|
|
a4c720debf
|
short long
|
2021-08-27 17:00:00 +05:30 |
|
|
eaa248c9e6
|
__call__ -> forward
|
2021-08-19 15:45:59 +05:30 |
|
|
876845d0c2
|
ResNet (#68)
|
2021-07-16 08:35:46 +05:30 |
|
|
1a9f15eebb
|
Distillation (#65)
|
2021-07-03 14:01:17 +05:30 |
|
|
7f05ed043b
|
FNet (#53)
|
2021-05-26 10:56:42 +05:30 |
|
|
2edf17fa8c
|
✨ group norm
|
2021-04-20 13:40:26 +05:30 |
|
|
983286e216
|
📚 batch norm
|
2021-02-01 14:43:11 +05:30 |
|
|
20d2e27a3c
|
📚 ffn notes
|
2021-01-25 22:09:11 +05:30 |
|
|
2927aa217b
|
gpt notes
|
2021-01-14 09:37:12 +05:30 |
|
|
4c769128cb
|
autoregression trainer notes
|
2021-01-14 08:46:41 +05:30 |
|
|
774a72e0bf
|
gpt
|
2021-01-13 12:54:43 +05:30 |
|
|
ce190701e8
|
global step
|
2021-01-07 21:11:50 +05:30 |
|
|
c124348b14
|
gradient clipping
|
2021-01-07 13:33:32 +05:30 |
|
|
dfefde657b
|
no loss smoothing
|
2021-01-07 12:02:19 +05:30 |
|
|
b9da12ee3f
|
d_model
|
2021-01-06 17:24:09 +05:30 |
|
|
4fe8392a8d
|
auto regression common exp
|
2020-12-27 07:30:20 +05:30 |
|
|
c64b98e390
|
basic auto regression experiment for reuse
|
2020-12-26 21:12:44 +05:30 |
|