FluxML · DhairyaLGandhi · Feb 16, 2021 · Feb 16, 2021 · Feb 16, 2021 · Feb 16, 2021
diff --git a/src/schedulers.jl b/src/schedulers.jl
@@ -0,0 +1,67 @@
+# f(t, p) = (2 / π) * abs(asin(sin(π * (t - 1) / p)))
+# sine(t, p = 1.) = (2 / π) * abs(asin(sin(π * (t - 1) / p)))
+
+# Simple scheduling can happen as a basic closure.
+triangle(t) = (1 - 2 * abs(round(Int, t/2) - t/2))
+
+mutable struct Schedule{O,F}
+  f::F
+  opt::O
+  cursor::Float32
+end
+
+"""
+    Schedule(f, opt)
+
+Create a scheduled optimiser whose update rule is controlled by `f`.
+
+`f` can be any callable, while `opt` can be any optimiser.
+
+See also [next](@ref), [init](@ref)
+"""
+function Schedule(f, opt)
+  Schedule(f, opt, 1.f0 + eps(Float32)) 
+end
+
+
+# Timestep: t - always depends on run
+# Phase: p - mostly likely constant
+
+# What we want to "schedule" - everything (so will have to let people mess with things)
+# Most likely learning rate
+# If `f` relies on only time - it can be generated on the fly
+
+"""
+    next(s::Schedule, state)
+
+Returns a new optimiser as described by the scheduler function
+and the optimiser. This allocates a new optimiser on the stack, keeping the original one intact.
+
+The state is a tuple of the state as defined by the scheduling function.
+"""
+function next(s::Schedule{O}, (cursor, cursor_step)) where O
+  cursor += cursor_step
+  ADAM(s.opt, eta = s.f(cursor) * s.opt.eta) #replace with O(..)
+end
+
+init(f, x) = (1.f0, 0.1f0)
+init(s::Schedule, x) = (init(s.f, x), init(s.opt, x))
+
+function apply(s::Schedule, x, dx, st)
+  schedst, optst = st
+  cursor, cursor_step = schedst
+  o = next(s, schedst)
+  Δ, optst2 = apply(o, x, dx, optst)
+  Δ, ((cursor .+ cursor_step, cursor_step), optst2)
+end
+
+struct InvDecay{T}
+  decay::T
+end
+
+init(inv::InvDecay, x) = (1, 1)
+(inv::InvDecay)(t) = 1 / (1 + inv.decay * t)
+
+InvDecay(s = 0.1f0) = InvDecay{typeof(s)}(s)
+
+sine(p) = t -> sin(Float32(π) * t / p)