fixed DescentWeightDecay parameters
This commit is contained in:
parent
d8394298bb
commit
1f0f2a5ac2
@ -226,7 +226,7 @@ end
|
|||||||
|
|
||||||
[ADAMW](https://arxiv.org/abs/1711.05101) fixing weight decay regularization in Adam.
|
[ADAMW](https://arxiv.org/abs/1711.05101) fixing weight decay regularization in Adam.
|
||||||
"""
|
"""
|
||||||
ADAMW(η = 0.001, β = (0.9, 0.999), η_decay = 1, γ_decay = 0) = Optimiser(ADAM(η, β, IdDict()), DescentWeightDecay(η_decay, γ_decay))
|
function ADAMW(η = 0.001, β = (0.9, 0.999), η_decay = 1, wd = 0)
  # Build the two stages separately, then chain them: an ADAM stage with a
  # fresh IdDict as its state, followed by a DescentWeightDecay stage that
  # receives η_decay and wd.
  adam_stage = ADAM(η, β, IdDict())
  decay_stage = DescentWeightDecay(η_decay, wd)
  return Optimiser(adam_stage, decay_stage)
end
|
||||||
|
|
||||||
# Compose optimizers
|
# Compose optimizers
|
||||||
|
|
||||||
@ -292,4 +292,4 @@ function update!(o::WeightDecay, x, Δ)
|
|||||||
@. Δ += wd * x
|
@. Δ += wd * x
|
||||||
end
|
end
|
||||||
|
|
||||||
DescentWeightDecay(η = 0.1, γ = 0) = Optimiser(WeightDecay(), Descent(η))
|
function DescentWeightDecay(η = 1, wd = 0)
  # The weight-decay stage always gets 1 as its first argument and wd as its
  # second; η is forwarded only to the Descent stage.
  decay_stage = WeightDecay(1, wd)
  descent_stage = Descent(η)
  return Optimiser(decay_stage, descent_stage)
end
|
Loading…
Reference in New Issue
Block a user