# # Optimizing Julia code
# This session provides an introduction to optimizing Julia code.
# The examples are developed with Julia v1.9.3.
# First, we install all required packages:
import Pkg
Pkg.activate(@__DIR__)
Pkg.instantiate()
# The markdown file is created from the source code using
# [Literate.jl](https://github.com/fredrikekre/Literate.jl).
# You can create the markdown file via
using Literate
Literate.markdown(joinpath(@__DIR__, "optimizing_julia.jl");
                  flavor = Literate.CommonMarkFlavor())
# ## Basics
#
# The Julia manual contains basic information about performance.
# In particular, you should be familiar with
#
# - https://docs.julialang.org/en/v1/manual/performance-tips/
# - https://docs.julialang.org/en/v1/manual/style-guide/
#
# if you care about performance.
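# As a minimal illustration of the most important tip - avoid untyped
# global variables - compare the following two functions (the names are
# made up for this demo):
not_a_constant = 1.0               # non-`const` global, its type may change
add_global(x) = x + not_a_constant # has to look up the global on every call
add_argument(x, y) = x + y         # passes the value explicitly instead
# `@code_warntype add_global(1.0)` reports `Any` for the return type,
# while `add_argument(1.0, not_a_constant)` is fully type-inferred.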
# ## Example: A linear advection simulation
#
# This is a classical partial differential equation (PDE) simulation setup.
# If you are not familiar with it, don't worry about the details - we just
# need an example. This one is similar to several problematic cases I have
# seen in practice.
# First, we generate initial data and store it in a file.
using HDF5
x = range(-1.0, 1.0, length = 1000)
dx = step(x)
h5open("initial_data.h5", "w") do io
    u0 = sinpi.(x)
    write_dataset(io, "x", collect(x))
    write_dataset(io, "u0", u0)
end
# Next, we write our simulation code as a function - as we have learned from
# the performance tips!
function simulate()
    x, u0 = h5open("initial_data.h5", "r") do io
        read_dataset(io, "x"), read_dataset(io, "u0")
    end
    t = 0
    u = u0
    while t < t_end
        u = u + dt * rhs(u)
        t = t + dt
    end
    return t, x, u, u0
end
function rhs(u)
    du = similar(u)
    for i in eachindex(u)
        im1 = i == firstindex(u) ? lastindex(u) : (i - 1)
        du[i] = -(u[i] - u[im1]) / dx
    end
    return du
end
# Now, we can define our parameters, run a simulation,
# and plot the results.
using Plots, LaTeXStrings
t_end = 2.5
dt = 0.9 * dx
t, x, u, u0 = simulate()
plot(x, u0; label = L"u_0", xguide = L"x")
plot!(x, u; label = L"u")
# Maybe you can already spot problems in the code above.
# Anyway, before you begin optimizing some code, you should
# test it and make sure it is correct. Let's assume this is
# the case here. You should also write tests making sure that
# the code continues to work as expected while you optimize
# it - a minimal example follows below.
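# A minimal smoke test could look like the following - just an
# illustration, not a complete test suite:
using Test
@testset "simulate" begin
    t, x, u, u0 = simulate()
    @test t >= t_end              # the time loop reached the final time
    @test length(u) == length(u0) # sizes are consistent
    @test all(isfinite, u)        # the solution did not blow up
end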
# ## Profiling
#
# First, we need to measure the performance of our code to
# see whether it is already reasonable. For this, you can use
# `@time` - or, better, BenchmarkTools.jl.
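# Since `simulate` has already been compiled by the earlier call,
# a plain `@time` gives a quick first impression of the runtime:
@time simulate()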
using BenchmarkTools
@benchmark simulate()
# This shows quite a lot of allocations - typically a bad sign
# for numerical simulations.
# There are also profiling tools available in Julia.
# Some of them come bundled with the Julia extension for
# Visual Studio Code. If you prefer working in the REPL,
# you can install ProfileView.jl (`@profview simulate()`) and
# PProf.jl (`pprof()` after creating a profile via `@profview`).
@profview simulate()
# Task: Optimize the code!
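# One possible solution - just a sketch, not the only way - is to pass
# all parameters explicitly as function arguments instead of relying on
# non-constant globals, and to update `u` in place. The names `rhs!` and
# `simulate_optimized` are introduced here for illustration:
function rhs!(du, u, dx)
    for i in eachindex(u)
        im1 = i == firstindex(u) ? lastindex(u) : (i - 1)
        du[i] = -(u[i] - u[im1]) / dx
    end
    return nothing
end
function simulate_optimized(t_end, dt, dx)
    x, u0 = h5open("initial_data.h5", "r") do io
        read_dataset(io, "x"), read_dataset(io, "u0")
    end
    t = zero(dt) # start with a floating point zero, not the `Int` literal 0
    u = copy(u0)
    du = similar(u)
    while t < t_end
        rhs!(du, u, dx)
        @. u = u + dt * du # in-place update, no new arrays per step
        t += dt
    end
    return t, x, u, u0
end
@benchmark simulate_optimized($t_end, $dt, $dx)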
# ## Introduction to generic Julia code and AD
#
# One of the strengths of Julia is that you can use quite a few
# modern tools such as automatic differentiation (AD). However,
# you need to learn a bit of Julia to use them efficiently.
# Here, we concentrate on ForwardDiff.jl.
using ForwardDiff
using Statistics
function foo0(x)
    vector = zeros(typeof(x), 100)
    foo0!(vector, x)
end
function foo0!(vector, scalar)
    for i in eachindex(vector)
        vector[i] = atan(i * scalar) / π
    end
    for _ in 1:1000
        for i in eachindex(vector)
            vector[i] = cos(vector[i])
        end
    end
    return mean(vector)
end
let x = 2 * π
    @show foo0(x)
    @show ForwardDiff.derivative(foo0, x)
    @benchmark foo0($x)
end
# The code above is basically a fixed-point iteration.
# With some analysis, one can figure out that it should
# converge to the solution `x` of `x == cos(x)`,
# the "Dottie number". See https://en.wikipedia.org/wiki/Dottie_number
using SimpleNonlinearSolve
function dottie_number()
    f(u, p) = cos(u) - u
    bounds = (0.0, 2.0)
    prob = IntervalNonlinearProblem(f, bounds)
    sol = solve(prob, ITP())
    return sol.u
end
dottie_number()
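# Since `foo0` applies `cos` a thousand times, its result should have
# converged to this fixed point - a quick consistency check:
foo0(2 * π) ≈ dottie_number()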
# Next, we introduce a custom struct. Can you spot the problems?
struct MyData1
    scalar
    vector
end
function foo1(x)
    data = MyData1(x, zeros(typeof(x), 100))
    foo1!(data)
end
function foo1!(data)
    (; scalar, vector) = data
    for i in eachindex(vector)
        vector[i] = atan(i * scalar) / π
    end
    for _ in 1:1000
        for i in eachindex(vector)
            vector[i] = cos(vector[i])
        end
    end
    return mean(vector)
end
let x = 2 * π
    @show foo1(x)
    @show ForwardDiff.derivative(foo1, x)
    @benchmark foo1($x)
end
# We can fix the type instabilities by annotating the fields with
# concrete types explicitly. But we lose the possibility to use AD this way!
struct MyData2
    scalar::Float64
    vector::Vector{Float64}
end
function foo2(x)
    data = MyData2(x, zeros(typeof(x), 100))
    foo1!(data)
end
let x = 2 * π
    @show foo2(x)
    @benchmark foo2($x)
end
let x = 2 * π
    ## This throws a `MethodError`: the `Dual` numbers used by
    ## ForwardDiff.jl cannot be converted to the `Float64` fields of `MyData2`.
    ForwardDiff.derivative(foo2, x)
end
# Thus, we need parametric types!
struct MyData3{T}
    scalar::T
    vector::Vector{T}
end
function foo3(x)
    data = MyData3(x, zeros(typeof(x), 100))
    foo1!(data)
end
let x = 2 * π
    @show foo3(x)
    @show ForwardDiff.derivative(foo3, x)
    @benchmark foo3($x)
end