e6b3c8a6a2 
					 
					
						
						
							
							jax docs  
						
						
						
						
					 
					
						2025-08-21 12:34:04 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						dd4519878a 
					 
					
						
						
							
							sitemap  
						
						
						
						
					 
					
						2025-08-12 12:11:33 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						9262c57f18 
					 
					
						
						
							
							flash attention  
						
						
						
						
					 
					
						2025-08-08 19:57:57 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						4752644737 
					 
					
						
						
							
							all comments  
						
						
						
						
					 
					
						2025-08-01 15:50:27 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						73b9892be6 
					 
					
						
						
							
							all comments  
						
						
						
						
					 
					
						2025-08-01 13:56:39 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						5a8182d21b 
					 
					
						
						
							
							backward pass formulas  
						
						
						
						
					 
					
						2025-08-01 13:24:57 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						a9b5c923eb 
					 
					
						
						
							
							backward pass formulas  
						
						
						
						
					 
					
						2025-07-31 17:15:26 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						0ae6e6ae2a 
					 
					
						
						
							
							flash comments  
						
						
						
						
					 
					
						2025-07-31 14:49:37 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						1bc2a69803 
					 
					
						
						
							
							flash comments  
						
						
						
						
					 
					
						2025-07-31 09:53:14 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						c4d2e8cd22 
					 
					
						
						
							
							docs  
						
						
						
						
					 
					
						2025-07-31 08:48:07 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						49ea8f06cb 
					 
					
						
						
							
							paperswithcode.com list  
						
						
						
						
					 
					
						2024-08-24 10:56:04 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						3e6a4eca80 
					 
					
						
						
							
							LoRA Chinese docs  
						
						
						
						
					 
					
						2024-08-24 10:52:30 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						5731bff586 
					 
					
						
						
							
							LoRA docs  
						
						
						
						
					 
					
						2024-08-24 10:50:02 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						9e1b35716d 
					 
					
						
						
							
							LoRA GPT2 n_heads fix and notes  
						
						
						
						
					 
					
						2024-08-18 17:04:58 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						012fc7f0f0 
					 
					
						
						
							
							LoRA GPT2 n_heads fix and notes  
						
						
						
						
					 
					
						2024-08-18 16:25:21 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						d5768ba423 
					 
					
						
						
							
							LoRA typo fix  
						
						
						
						
					 
					
						2024-08-18 15:07:56 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						9dd97ff11a 
					 
					
						
						
							
							LoRA transpose  
						
						
						
						
					 
					
						2024-08-18 14:37:14 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						ce21dcf76c 
					 
					
						
						
							
							LoRA experiment  
						
						
						
						
					 
					
						2024-08-18 14:26:33 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						f3465ac926 
					 
					
						
						
							
							Chineese translation  
						
						
						
						
					 
					
						2024-08-16 16:35:25 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						edf875aa70 
					 
					
						
						
							
							LoRA experiment notes  
						
						
						
						
					 
					
						2024-08-16 16:25:19 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						d4af40b595 
					 
					
						
						
							
							LoRA notes  
						
						
						
						
					 
					
						2024-08-03 16:59:15 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						f6e913eb09 
					 
					
						
						
							
							transformer mha chinese translation  
						
						
						
						
					 
					
						2024-06-27 19:35:37 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						26e64a8827 
					 
					
						
						
							
							zh  
						
						
						
						
					 
					
						2024-06-24 15:59:56 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						20494ae94c 
					 
					
						
						
							
							fix gae formula  
						
						
						
						
					 
					
						2024-06-24 15:58:03 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						d858f2eec0 
					 
					
						
						
							
							remove tranding papers link  
						
						
						
						
					 
					
						2024-06-21 19:35:22 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						0bb4be3ff9 
					 
					
						
						
							
							zh translation  
						
						
						
						
					 
					
						2024-06-21 19:28:14 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						bf8a491250 
					 
					
						
						
							
							chineese translation  
						
						
						
						
					 
					
						2024-06-21 19:09:13 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						09d09379c2 
					 
					
						
						
							
							fix value pe double rotation  
						
						
						
						
					 
					
						2024-06-20 12:53:09 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						2236f6383c 
					 
					
						
						
							
							fix rope test code  
						
						
						
						
					 
					
						2024-06-20 12:49:27 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						cf565bcc1d 
					 
					
						
						
							
							cleanup  
						
						
						
						
					 
					
						2024-06-18 11:09:02 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						999f2036a5 
					 
					
						
						
							
							RWKV docs  
						
						
						
						
					 
					
						2024-03-17 17:47:51 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						df9e1af615 
					 
					
						
						
							
							RWKV docs  
						
						
						
						
					 
					
						2024-03-17 17:45:08 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						7db6e92376 
					 
					
						
						
							
							RWKV  ( #222 )  
						
						... 
						
						
						
						* rwkv-init
* annotations
* Re-added docs
* make dir if not exist
* Add RWKV paper and update doc index
* add train loop
* experiment
---------
Co-authored-by: Jacob Hatef <hatef.4@buckeyemail.buckeyemail.osu.edu>
Co-authored-by: Quentin Anthony <qganthony@yahoo.com> 
						
						
					 
					
						2024-03-17 17:36:15 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						285cb3735b 
					 
					
						
						
							
							uodate docs  
						
						
						
						
					 
					
						2024-03-02 14:33:53 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						a0679ecd90 
					 
					
						
						
							
							title  
						
						
						
						
					 
					
						2024-01-12 13:21:54 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						45dc127061 
					 
					
						
						
							
							Merge pull request  #235  from qiangxinglin/master  
						
						... 
						
						
						
						Fix typo chineese translation 
						
						
					 
					
						2024-01-12 13:18:50 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						81cf808d05 
					 
					
						
						
							
							rope typo  
						
						
						
						
					 
					
						2024-01-12 13:17:39 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						4135eda943 
					 
					
						
						
							
							title  
						
						
						
						
					 
					
						2024-01-12 13:15:04 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						fdd4da6401 
					 
					
						
						
							
							Fix typo  
						
						
						
						
					 
					
						2023-12-24 12:08:10 +08:00 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						b18a82213d 
					 
					
						
						
							
							docs  
						
						
						
						
					 
					
						2023-11-17 19:40:59 +00:00 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						f42c0e9cf4 
					 
					
						
						
							
							right shift example comment fix  
						
						
						
						
					 
					
						2023-11-07 09:28:22 +00:00 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						a2d6e805a6 
					 
					
						
						
							
							fix beta expression in ddpm docs  
						
						
						
						
					 
					
						2023-11-07 09:13:19 +00:00 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						f26c603648 
					 
					
						
						
							
							update docs  
						
						
						
						
					 
					
						2023-11-07 09:10:13 +00:00 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						ba58ad9720 
					 
					
						
						
							
							version  
						
						
						
						
					 
					
						2023-11-07 09:06:49 +00:00 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						9a42ac2697 
					 
					
						
						
							
							arxiv.org links  
						
						
						
						
					 
					
						2023-10-24 14:42:32 +01:00 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						753fbd3446 
					 
					
						
						
							
							typo fix docs  
						
						
						
						
					 
					
						2023-07-15 08:35:33 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						b43fb807a8 
					 
					
						
						
							
							sophia speed up  
						
						
						
						
					 
					
						2023-07-15 08:30:41 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						0101618de6 
					 
					
						
						
							
							links  
						
						
						
						
					 
					
						2023-07-14 21:27:44 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						8db330dd22 
					 
					
						
						
							
							sophia-g docs  
						
						
						
						
					 
					
						2023-07-14 21:25:08 +05:30 
						 
				 
			
				
					
						
					 
					
						
						
							
						
						e8a5febf01 
					 
					
						
						
							
							docs  
						
						
						
						
					 
					
						2023-06-30 17:21:53 +05:30