@@ -133,11 +133,11 @@ opt = RMSProp(0.002, 0.95)
133
133
mutable struct RMSProp <: AbstractOptimiser
    # Field order is what the 4-argument default constructor expects:
    # (eta, rho, acc, epsilon).
    eta::Float64      # filled from the positional argument η
    rho::Float64      # filled from the positional argument ρ
    acc::IdDict       # empty when built through the convenience constructor below
    epsilon::Float64  # filled from the keyword argument ϵ
end

# Convenience constructor: η and ρ are optional positionals, ϵ is keyword-only.
# The default for ϵ comes from a binding named `ϵ` outside this definition
# (not visible in this excerpt). A new, empty IdDict is created on every call.
function RMSProp(η = 0.001, ρ = 0.9; ϵ = ϵ)
    return RMSProp(η, ρ, IdDict(), ϵ)
end
141
141
142
142
function apply! (o:: RMSProp , x, Δ)
143
143
η, ρ = o. eta, o. rho
@@ -167,11 +167,11 @@ opt = ADAM(0.001, (0.9, 0.8))
167
167
mutable struct ADAM <: AbstractOptimiser
    # Field order is what the 4-argument default constructor expects:
    # (eta, beta, state, epsilon).
    eta::Float64                  # filled from the positional argument η
    beta::Tuple{Float64,Float64}  # filled from the positional argument β (a 2-tuple)
    state::IdDict                 # empty when built through the convenience constructor below
    epsilon::Float64              # filled from the keyword argument ϵ
end

# Convenience constructor: η and β are optional positionals, ϵ is keyword-only.
# The default for ϵ comes from a binding named `ϵ` outside this definition
# (not visible in this excerpt). A new, empty IdDict is created on every call.
function ADAM(η = 0.001, β = (0.9, 0.999); ϵ = ϵ)
    return ADAM(η, β, IdDict(), ϵ)
end
175
175
176
176
function apply! (o:: ADAM , x, Δ)
177
177
η, β = o. eta, o. beta
@@ -209,11 +209,11 @@ opt = RADAM(0.001, (0.9, 0.8))
209
209
mutable struct RADAM <: AbstractOptimiser
    # Field order is what the 4-argument default constructor expects:
    # (eta, beta, state, epsilon).
    eta::Float64                  # filled from the positional argument η
    beta::Tuple{Float64,Float64}  # filled from the positional argument β (a 2-tuple)
    state::IdDict                 # empty when built through the convenience constructor below
    epsilon::Float64              # filled from the keyword argument ϵ
end

# Convenience constructor: η and β are optional positionals, ϵ is keyword-only.
# The default for ϵ comes from a binding named `ϵ` outside this definition
# (not visible in this excerpt). A new, empty IdDict is created on every call.
function RADAM(η = 0.001, β = (0.9, 0.999); ϵ = ϵ)
    return RADAM(η, β, IdDict(), ϵ)
end
217
217
218
218
function apply! (o:: RADAM , x, Δ)
219
219
η, β = o. eta, o. beta
@@ -259,11 +259,11 @@ opt = AdaMax(0.001, (0.9, 0.995))
259
259
mutable struct AdaMax <: AbstractOptimiser
    # Field order is what the 4-argument default constructor expects:
    # (eta, beta, state, epsilon).
    eta::Float64                  # filled from the positional argument η
    beta::Tuple{Float64,Float64}  # filled from the positional argument β (a 2-tuple)
    state::IdDict                 # empty when built through the convenience constructor below
    epsilon::Float64              # filled from the keyword argument ϵ
end

# Convenience constructor: η and β are optional positionals, ϵ is keyword-only.
# The default for ϵ comes from a binding named `ϵ` outside this definition
# (not visible in this excerpt). A new, empty IdDict is created on every call.
function AdaMax(η = 0.001, β = (0.9, 0.999); ϵ = ϵ)
    return AdaMax(η, β, IdDict(), ϵ)
end
267
267
268
268
function apply! (o:: AdaMax , x, Δ)
269
269
η, β = o. eta, o. beta
@@ -302,11 +302,11 @@ opt = OADAM(0.001, (0.9, 0.995))
302
302
mutable struct OADAM <: AbstractOptimiser
    # Field order is what the 4-argument default constructor expects:
    # (eta, beta, state, epsilon).
    eta::Float64                  # filled from the positional argument η
    beta::Tuple{Float64,Float64}  # filled from the positional argument β (a 2-tuple)
    state::IdDict                 # empty when built through the convenience constructor below
    epsilon::Float64              # filled from the keyword argument ϵ
end

# Convenience constructor: η and β are optional positionals, ϵ is keyword-only.
# Note the β default here is (0.5, 0.9). The default for ϵ comes from a binding
# named `ϵ` outside this definition (not visible in this excerpt). A new, empty
# IdDict is created on every call.
function OADAM(η = 0.001, β = (0.5, 0.9); ϵ = ϵ)
    return OADAM(η, β, IdDict(), ϵ)
end
310
310
311
311
function apply! (o:: OADAM , x, Δ)
312
312
η, β = o. eta, o. beta
@@ -345,11 +345,11 @@ opt = ADAGrad(0.001)
345
345
"""
346
346
mutable struct ADAGrad <: AbstractOptimiser
    # Field order is what the 3-argument default constructor expects:
    # (eta, acc, epsilon).
    eta::Float64      # filled from the positional argument η
    acc::IdDict       # empty when built through the convenience constructor below
    epsilon::Float64  # filled from the keyword argument ϵ
end

# Convenience constructor: η is an optional positional, ϵ is keyword-only.
# The default for ϵ comes from a binding named `ϵ` outside this definition
# (not visible in this excerpt). A new, empty IdDict is created on every call.
function ADAGrad(η = 0.1; ϵ = ϵ)
    return ADAGrad(η, IdDict(), ϵ)
end
353
353
354
354
function apply! (o:: ADAGrad , x, Δ)
355
355
η = o. eta
@@ -377,11 +377,11 @@ opt = ADADelta(0.89)
377
377
"""
378
378
mutable struct ADADelta <: AbstractOptimiser
    # Field order is what the 3-argument default constructor expects:
    # (rho, state, epsilon).
    rho::Float64      # filled from the positional argument ρ
    state::IdDict     # empty when built through the convenience constructor below
    epsilon::Float64  # filled from the keyword argument ϵ
end

# Convenience constructor: ρ is an optional positional, ϵ is keyword-only.
# The default for ϵ comes from a binding named `ϵ` outside this definition
# (not visible in this excerpt). A new, empty IdDict is created on every call.
function ADADelta(ρ = 0.9; ϵ = ϵ)
    return ADADelta(ρ, IdDict(), ϵ)
end
385
385
386
386
function apply! (o:: ADADelta , x, Δ)
387
387
ρ = o. rho
@@ -416,11 +416,11 @@ opt = AMSGrad(0.001, (0.89, 0.995))
416
416
mutable struct AMSGrad <: AbstractOptimiser
    # Field order is what the 4-argument default constructor expects:
    # (eta, beta, state, epsilon).
    eta::Float64                   # filled from the positional argument η
    beta::Tuple{Float64, Float64}  # filled from the positional argument β (a 2-tuple)
    state::IdDict                  # empty when built through the convenience constructor below
    epsilon::Float64               # filled from the keyword argument ϵ
end

# Convenience constructor: η and β are optional positionals, ϵ is keyword-only.
# The default for ϵ comes from a binding named `ϵ` outside this definition
# (not visible in this excerpt). A new, empty IdDict is created on every call.
function AMSGrad(η = 0.001, β = (0.9, 0.999); ϵ = ϵ)
    return AMSGrad(η, β, IdDict(), ϵ)
end
424
424
425
425
function apply! (o:: AMSGrad , x, Δ)
426
426
η, β = o. eta, o. beta
@@ -457,11 +457,11 @@ opt = NADAM(0.002, (0.89, 0.995))
457
457
mutable struct NADAM <: AbstractOptimiser
    # Field order is what the 4-argument default constructor expects:
    # (eta, beta, state, epsilon).
    eta::Float64                   # filled from the positional argument η
    beta::Tuple{Float64, Float64}  # filled from the positional argument β (a 2-tuple)
    state::IdDict                  # empty when built through the convenience constructor below
    epsilon::Float64               # filled from the keyword argument ϵ
end

# Convenience constructor: η and β are optional positionals, ϵ is keyword-only.
# The default for ϵ comes from a binding named `ϵ` outside this definition
# (not visible in this excerpt). A new, empty IdDict is created on every call.
function NADAM(η = 0.001, β = (0.9, 0.999); ϵ = ϵ)
    return NADAM(η, β, IdDict(), ϵ)
end
465
465
466
466
function apply! (o:: NADAM , x, Δ)
467
467
η, β = o. eta, o. beta
@@ -524,11 +524,11 @@ opt = AdaBelief(0.001, (0.9, 0.8))
524
524
mutable struct AdaBelief <: AbstractOptimiser
    # Declared as a subtype of AbstractOptimiser so that it matches every other
    # optimiser struct in this file and is accepted wherever code dispatches on
    # that abstract type.
    #
    # Field order is what the 4-argument default constructor expects:
    # (eta, beta, state, epsilon).
    eta::Float64                  # filled from the positional argument η
    beta::Tuple{Float64,Float64}  # filled from the positional argument β (a 2-tuple)
    state::IdDict                 # empty when built through the convenience constructor below
    epsilon::Float64              # filled from the keyword argument ϵ
end

# Convenience constructor: η and β are optional positionals, ϵ is keyword-only.
# The default for ϵ comes from a binding named `ϵ` outside this definition
# (not visible in this excerpt). A new, empty IdDict is created on every call.
function AdaBelief(η = 0.001, β = (0.9, 0.999); ϵ = ϵ)
    return AdaBelief(η, β, IdDict(), ϵ)
end
532
532
533
533
function apply! (o:: AdaBelief , x, Δ)
534
534
η, β = o. eta, o. beta
0 commit comments