Merge pull request #100 from agdestein/revision
Revision
agdestein authored Nov 2, 2024
2 parents 35346e4 + 3407eff commit add4243
Showing 27 changed files with 3,073 additions and 2,103 deletions.
2 changes: 1 addition & 1 deletion docs/src/components/GalleryImage.vue
@@ -17,7 +17,7 @@ defineProps<Props>();
<template>
<div class="img-box">
<a :href="href">
<img :src="withBase(src)" heigth="100px" alt="">
<img :src="withBase(src)" height="100px" alt="">
<div class="transparent-box1">
<div class="caption">
<h2>{{ caption }}</h2>
1 change: 1 addition & 0 deletions docs/src/manual/time.md
@@ -76,6 +76,7 @@ AbstractRungeKuttaMethod
ExplicitRungeKuttaMethod
ImplicitRungeKuttaMethod
RKMethods
LMWray3
```

### Explicit Methods
8 changes: 6 additions & 2 deletions lib/NeuralClosure/Project.toml
@@ -11,15 +11,17 @@ IncompressibleNavierStokes = "5e318141-6589-402b-868d-77d7df8c442e"
KernelAbstractions = "63c18a36-062a-441e-b654-da1e3ab1ce7c"
LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e"
Lux = "b2108857-7c20-44ae-9111-449ecde12c47"
MLUtils = "f1d291b0-491e-4a28-83b9-f70985020b54"
Makie = "ee78f7c6-11fb-53f2-987a-cfe4a2b5a57a"
NNlib = "872c559c-99b0-510c-b3b7-b6c96a88d5cd"
Observables = "510215fc-4207-5dde-b226-833fc4488ee2"
Optimisers = "3bd65402-5787-11e9-1adc-39752487f4e2"
Printf = "de0858da-6303-5e67-8744-51eddeeeb8d7"
Random = "9a3f8284-a2c9-5f02-9a11-845980a1fd5c"
Zygote = "e88e6eb3-aa80-5325-afca-941959d7151f"

[sources.IncompressibleNavierStokes]
path = "../.."
[sources]
IncompressibleNavierStokes = {path = "../.."}

[compat]
Accessors = "0.1"
@@ -29,10 +31,12 @@ IncompressibleNavierStokes = "1"
KernelAbstractions = "0.9"
LinearAlgebra = "1"
Lux = "1"
MLUtils = "0.4"
Makie = "0.21"
NNlib = "0.9"
Observables = "0.5"
Optimisers = "0.3"
Printf = "1"
Random = "1"
Zygote = "0.6"
julia = "1.9"
11 changes: 5 additions & 6 deletions lib/NeuralClosure/src/NeuralClosure.jl
@@ -12,9 +12,11 @@ using KernelAbstractions
using LinearAlgebra
using Lux
using Makie
using MLUtils
using NNlib
using Observables
using Optimisers
using Printf
using Random
using Zygote

@@ -30,12 +32,9 @@ include("filter.jl")
include("data_generation.jl")

export cnn, gcnn, fno, FourierLayer, GroupConv2D, rot2, rot2stag
export train
export mean_squared_error,
create_relerr_prior,
create_relerr_post,
create_relerr_symmetry_prior,
create_relerr_symmetry_post
export train, trainepoch
export create_relerr_prior,
create_relerr_post, create_relerr_symmetry_prior, create_relerr_symmetry_post
export create_loss_prior, create_loss_post
export create_dataloader_prior, create_dataloader_post
export create_callback, create_les_data, create_io_arrays
8 changes: 5 additions & 3 deletions lib/NeuralClosure/src/data_generation.jl
@@ -84,7 +84,7 @@ filtersaver(
# # Overwrite LES body force field with filtered DNS bodyforce.
# # In principle, they should be very similar, but the original LES
# # body force field is obtained with pointwise evaluation,
# # while the one appearing in the filterd DNS equation is
# # while the one appearing in the filtered DNS equation is
# # discretely filtered.
# @assert les.issteadybodyforce
# Φ(les.bodyforce, dns.bodyforce, les, compression)
@@ -167,6 +167,7 @@ function create_les_data(;
(; u, t), outputs = solve_unsteady(;
setup = dns,
ustart,
docopy = false, # Overwrite initial conditions to save memory
tlims = (T(0), tburn),
Δt,
method,
@@ -180,6 +181,7 @@
_, outputs = solve_unsteady(;
setup = dns,
ustart = u,
docopy = false, # Overwrite initial conditions to save memory
tlims = (T(0), tsim),
Δt,
method,
@@ -195,10 +197,10 @@
psolver_les;
nupdate = savefreq,

# Reuse arrays from cache.
# Reuse arrays from cache to save memory in 3D DNS.
# Since processors are called outside
# Runge-Kutta steps, there is no danger
# in overwriteng the arrays.
# in overwriting the arrays.
F = cache.u₀,
p = cache.p,
),
172 changes: 108 additions & 64 deletions lib/NeuralClosure/src/training.jl
@@ -3,27 +3,38 @@ Create dataloader that uses a batch of `batchsize` random samples from
`data` at each evaluation.
The batch is moved to `device`.
"""
create_dataloader_prior(data; batchsize = 50, device = identity) = function dataloader(rng)
function create_dataloader_prior(data; batchsize = 50, device = identity)
x, y = data
nsample = size(x)[end]
d = ndims(x)
i = sort(shuffle(rng, 1:nsample)[1:batchsize])
xuse = device(Array(selectdim(x, d, i)))
yuse = device(Array(selectdim(y, d, i)))
(xuse, yuse), rng
xcpu = Array(selectdim(x, d, 1:batchsize))
ycpu = Array(selectdim(y, d, 1:batchsize))
xuse = xcpu |> device
yuse = ycpu |> device
function dataloader(rng)
i = sort(shuffle(rng, 1:nsample)[1:batchsize])
copyto!(xcpu, selectdim(x, d, i))
copyto!(ycpu, selectdim(y, d, i))
copyto!(xuse, xcpu)
copyto!(yuse, ycpu)
(xuse, yuse), rng
end
end
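
A minimal usage sketch for the prior dataloader, assuming an in-memory sample pair with samples along the last dimension; the array shapes and `device = identity` below are purely illustrative.

```julia
using Random
# Illustrative data: 200 (input, target) samples stacked along the last dimension.
x = randn(Float32, 16, 16, 2, 200)
y = randn(Float32, 16, 16, 2, 200)
dataloader = create_dataloader_prior((x, y); batchsize = 50, device = identity)
rng = Xoshiro(0)
(xb, yb), rng = dataloader(rng)  # one random batch of 50 samples, reusing the same buffers
```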

"""
Create trajectory dataloader.
"""
create_dataloader_post(trajectories; nunroll = 10, device = identity) =
create_dataloader_post(trajectories; ntrajectory, nunroll, device = identity) =
function dataloader(rng)
(; u, t) = rand(rng, trajectories)
nt = length(t)
@assert nt ≥ nunroll
istart = rand(rng, 1:nt-nunroll)
it = istart:istart+nunroll
(; u = device.(u[it]), t = t[it]), rng
batch = shuffle(rng, trajectories)[1:ntrajectory] # Select a subset of trajectories
data = map(batch) do (; u, t)
nt = length(t)
@assert nt ≥ nunroll "Trajectory too short for nunroll = $nunroll"
istart = rand(rng, 1:nt-nunroll)
it = istart:istart+nunroll
(; u = device.(u[it]), t = t[it])
end
data, rng
end
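
A hedged sketch of the multi-trajectory loader; the trajectories below are synthetic stand-ins for the `(; u, t)` named tuples used for a-posteriori training.

```julia
using Random
# Five synthetic trajectories of 30 snapshots each (snapshot shapes are illustrative).
trajectories = [
    (; u = [randn(Float32, 18, 18, 2) for _ = 1:30], t = collect(range(0.0f0, 1.0f0, 30)))
    for _ = 1:5
]
dataloader = create_dataloader_post(trajectories; ntrajectory = 2, nunroll = 10)
batch, rng = dataloader(Xoshiro(0))  # two random sub-trajectories of nunroll + 1 snapshots each
```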

"""
Expand All @@ -33,11 +44,12 @@ optimiser `opt` for `niter` iterations.
Return a new named tuple `(; opt, θ, callbackstate)` with
updated state and parameters.
"""
function train(; dataloader, loss, trainstate, niter = 100, callback, callbackstate)
for i = 1:niter
function train(; dataloader, loss, trainstate, niter, callback, callbackstate, λ = nothing)
for _ = 1:niter
(; optstate, θ, rng) = trainstate
batch, rng = dataloader(rng)
g, = gradient(θ -> loss(batch, θ), θ)
isnothing(λ) || @.(g += λ * θ) # Weight decay
optstate, θ = Optimisers.update!(optstate, θ, g)
trainstate = (; optstate, θ, rng)
callbackstate = callback(callbackstate, trainstate)
@@ -46,72 +58,92 @@ function train(; dataloader, loss, trainstate, niter = 100, callback, callbackst
end
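
A minimal sketch of driving `train` with a trivial stand-in dataloader, a placeholder loss, and a no-op callback; `λ` is the optional weight-decay factor.

```julia
using Optimisers, Random
dataloader(rng) = (nothing, rng)                     # trivial stand-in: batch is ignored by `loss`
θ = randn(Float32, 100)                              # placeholder parameters
loss(batch, θ) = sum(abs2, θ)                        # placeholder loss
trainstate = (; optstate = Optimisers.setup(Adam(1.0f-3), θ), θ, rng = Xoshiro(0))
callback(callbackstate, trainstate) = callbackstate  # no-op callback
(; trainstate, callbackstate) = train(;
    dataloader, loss, trainstate, niter = 10,
    callback, callbackstate = nothing, λ = 1.0f-6,
)
```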

"""
Wrap loss function `loss(batch, θ)`.
Update parameters `θ` to minimize `loss(dataloader(), θ)` using the
optimiser `opt` for `niter` iterations.
The function `loss` should take inputs like `loss(f, x, y, θ)`.
Return a new named tuple `(; opt, θ, callbackstate)` with
updated state and parameters.
"""
create_loss_prior(loss, f) = ((x, y), θ) -> loss(f, x, y, θ)
function trainepoch(;
dataloader,
loss,
trainstate,
callback,
callbackstate,
device,
noiselevel,
λ = nothing,
)
(; batchsize, data) = dataloader
x = data[1]
x = selectdim(x, ndims(x), 1:batchsize) |> Array |> device
y = copy(x)
noisebuf = copy(x)
batch = (x, y)
for batch_cpu in dataloader
(; optstate, θ, rng) = trainstate
copyto!.(batch, batch_cpu)
if !isnothing(noiselevel)
# Add noise to input
x, y = batch
randn!(rng, noisebuf)
@. x += noiselevel * noisebuf
batch = x, y
end
g, = gradient(θ -> loss(batch, θ), θ)
isnothing(λ) || @.(g += λ * θ) # Weight decay
optstate, θ = Optimisers.update!(optstate, θ, g)
trainstate = (; optstate, θ, rng)
callbackstate = callback(callbackstate, trainstate)
end
(; trainstate, callbackstate)
end
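
`trainepoch` reads `batchsize` and `data` from its dataloader and iterates it once per epoch, which is consistent with an MLUtils `DataLoader` (MLUtils is added as a dependency in this revision); a hedged construction sketch with illustrative shapes:

```julia
using MLUtils
x = randn(Float32, 16, 16, 2, 200)
y = randn(Float32, 16, 16, 2, 200)
dataloader = DataLoader((x, y); batchsize = 50, shuffle = true)
dataloader.batchsize, size(dataloader.data[1])  # the fields trainepoch uses above
```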

"Return mean squared error loss for the predictor `f`."
function create_loss_prior(f, normalize = y -> sum(abs2, y))
loss_prior((x, y), θ) = sum(abs2, f(x, θ) - y) / normalize(y)
end

"""
Create a-priori error.
"""
create_relerr_prior(f, x, y) = θ -> norm(f(x, θ) - y) / norm(y)
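
A small sketch combining the two a-priori helpers with a toy predictor; the linear `f` and scalar parameter are illustrative only.

```julia
f(x, θ) = θ .* x                       # toy predictor
x = randn(Float32, 16, 16, 2, 50)
y = 2.0f0 .* x
loss = create_loss_prior(f)            # ((x, y), θ) -> squared error normalized by sum(abs2, y)
relerr = create_relerr_prior(f, x, y)  # θ -> relative error on this fixed (x, y)
loss((x, y), 2.0f0), relerr(2.0f0)     # both zero for the exact parameter value
```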

"""
Compute MSE between `f(x, θ)` and `y`.
The MSE is further divided by `normalize(y)`.
"""
mean_squared_error(f, x, y, θ; normalize = y -> sum(abs2, y), λ = sqrt(eltype(x)(1e-8))) =
sum(abs2, f(x, θ) - y) / normalize(y) + λ * sum(abs2, θ)

"""
Create a-posteriori loss function.
"""
function create_loss_post(;
setup,
method = RKMethods.RK44(; T = eltype(setup.grid.x[1])),
psolver,
closure,
nupdate = 1,
)
function create_loss_post(; setup, method, psolver, closure, nsubstep = 1)
closure_model = wrappedclosure(closure, setup)
setup = (; setup..., closure_model)
(; dimension, Iu) = setup.grid
(; dimension, Iu, x) = setup.grid
D = dimension()
function loss_post(data, θ)
T = eltype(θ)
(; u, t) = data
v = u[1]
stepper = create_stepper(method; setup, psolver, u = v, temp = nothing, t = t[1])
loss = zero(eltype(v[1]))
for it = 2:length(t)
Δt = (t[it] - t[it-1]) / nupdate
for isub = 1:nupdate
stepper = timestep(method, stepper, Δt; θ)
end
a, b = T(0), T(0)
for α = 1:length(u[1])
a += sum(abs2, (stepper.u[α]-u[it][α])[Iu[α]])
b += sum(abs2, u[it][α][Iu[α]])
loss_post(data, θ) =
sum(data) do (; u, t)
T = eltype(θ)
v = u[1]
stepper =
create_stepper(method; setup, psolver, u = v, temp = nothing, t = t[1])
loss = zero(T)
for it = 2:length(t)
Δt = (t[it] - t[it-1]) / nsubstep
for isub = 1:nsubstep
stepper = timestep(method, stepper, Δt; θ)
end
a, b = T(0), T(0)
for α = 1:length(u[1])
a += sum(abs2, (stepper.u[α]-u[it][α])[Iu[α]])
b += sum(abs2, u[it][α][Iu[α]])
end
loss += a / b
end
loss += a / b
end
loss / (length(t) - 1)
end
loss / (length(t) - 1)
end / length(data)
end
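
A hedged construction sketch for the a-posteriori loss; `setup`, `psolver`, `closure`, `data`, and `θ` are assumed to come from the usual IncompressibleNavierStokes/NeuralClosure pipeline and are not defined here.

```julia
# Assumes `setup`, `psolver`, and `closure` were created elsewhere.
loss = create_loss_post(;
    setup,
    method = RKMethods.RK44(; T = Float32),  # e.g. an explicit fourth-order Runge-Kutta method
    psolver,
    closure,
    nsubstep = 2,  # two solver steps per stored snapshot interval
)
loss(data, θ)      # `data`: a vector of (; u, t) trajectories from the post dataloader
```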

"""
Create a-posteriori relative error.
"""
function create_relerr_post(;
data,
setup,
method = RKMethods.RK44(; T = eltype(setup.grid.x[1])),
psolver,
closure_model,
nupdate = 1,
)
function create_relerr_post(; data, setup, method, psolver, closure_model, nsubstep = 1)
setup = (; setup..., closure_model)
(; dimension, Iu) = setup.grid
D = dimension()
@@ -124,8 +156,8 @@ function create_relerr_post(;
stepper = create_stepper(method; setup, psolver, u = v, temp = nothing, t = t[1])
e = zero(T)
for it = 2:length(t)
Δt = (t[it] - t[it-1]) / nupdate
for isub = 1:nupdate
Δt = (t[it] - t[it-1]) / nsubstep
for isub = 1:nsubstep
stepper =
IncompressibleNavierStokes.timestep!(method, stepper, Δt; θ, cache)
end
@@ -240,15 +272,22 @@ function create_callback(
obs[] = callbackstate.hist
displayfig && display(fig)
function callback(callbackstate, trainstate)
@reset callbackstate.n += 1
(; n, hist) = callbackstate
if n % nupdate == 0
(; θ) = trainstate
e = err(θ)
newtime = time()
itertime = (newtime - callbackstate.ctime) / nupdate
@reset callbackstate.ctime = newtime
@info "Iteration $n \t relative error: $e \t sec/iter: $itertime"
@info join(
[
"Iteration $n",
@sprintf("relative error: %.4g", e),
@sprintf("sec/iter: %.4g", itertime),
@sprintf("eta: %.4g", getlearningrate(trainstate.optstate.rule)),
],
"\t",
)
hist = push!(copy(hist), Point2f(n, e))
@reset callbackstate.hist = hist
obs[] = hist
@@ -261,7 +300,12 @@
@reset callbackstate.emin = e
end
end
@reset callbackstate.n += 1
callbackstate
end
(; callbackstate, callback)
end

getlearningrate(r::Adam) = r.eta
getlearningrate(r::OptimiserChain{Tuple{Adam,WeightDecay}}) = r.opts[1].eta
getlearningrate(r) = -1
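
The `getlearningrate` helper feeds the optimiser's `eta` into the callback's log line above; a quick sketch of the three dispatch cases:

```julia
using Optimisers
getlearningrate(Adam(1.0f-3))                                        # 0.001
getlearningrate(OptimiserChain(Adam(1.0f-3), WeightDecay(1.0f-6)))   # 0.001
getlearningrate(Descent(0.1))                                        # -1 (fallback for other rules)
```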