mirror of
				https://github.com/labmlai/annotated_deep_learning_paper_implementations.git
				synced 2025-10-31 18:58:43 +08:00 
			
		
		
		
	default warm up
This commit is contained in:
		| @@ -30,7 +30,7 @@ class OptimizerConfigs(BaseConfigs): | ||||
|  | ||||
|     momentum: float = 0.5 | ||||
|     amsgrad: bool = False | ||||
| -   warmup: int = 0 | ||||
| +   warmup: int = 2_000 | ||||
|     degenerated_to_sgd: bool = True | ||||
|     rectify: bool = True | ||||
|     d_model: int | ||||
|  | ||||
		Reference in New Issue
	
	Block a user
	 Varuna Jayasiri
					Varuna Jayasiri