NL Opt 2: Multivariate Optimization

Packages Used: Functions from the following packages are used in this notebook for the first time:
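A plausible set of imports, inferred from the packages referenced later in the notebook (Optim, DataFrames, and CSV are named in the text; Plots and Statistics are assumptions for the plotting and correlation steps):

```julia
using Optim           # optimize: Nelder-Mead and gradient-based methods
using Plots           # scatter plots of points and data (assumed)
using Statistics      # cor: correlation coefficient (assumed)
using DataFrames      # tabular data
using CSV             # reading CSV files
```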

Multivariate optimization corresponds to the optimization of a function of two or more variables and is the most flexible type of nonlinear optimization.

$ \begin{eqnarray*} \quad \mathbf{x}^* &=& \mathrm{arg}\underset{\mathbf{x}}{\operatorname{min}} \bigl\{ f(\mathbf{x}) \bigr\} \\ T\!C^* &=& f(\mathbf{x}^*) \end{eqnarray*}$

Procedures for unconstrained multivariate optimization differ with respect to whether they require information regarding the gradient, where the gradient is the multivariate version of the derivative. The Nelder-Mead method (1965) is the most widely used direct, or gradient-free, method available, in contrast to gradient-based methods that require gradients to be either provided or estimated, which can be difficult or impossible for some functions. Gradient-based methods are typically only used when working in high-dimensional spaces, which is common when, for example, training a neural network.

1. Gradient-free Optimization

Ex 1: Euclidean 2-D distances

Given a 2-D point x and m other 2-D points in P, create a function dist2 to determine the Euclidean (i.e., straight-line) distance d from x to each of the m points in P:

$ \begin{array}{l} \quad\bf{x} = \left[ \begin{array}{cc} x_1 \\ x_2 \end{array} \right],\quad \bf{P} = \left[ \begin{array}{cc} p_{1,1} & p_{1,2} \\ \vdots & \vdots \\ p_{m,1} & p_{m,2} \end{array} \right] \\ \quad\bf{d} = \left[ \begin{array}{cc} d_1 \\ \vdots \\ d_m \end{array} \right] = \left[ \begin{array}{c} \sqrt{\left(x_1 - p_{1,1}\right)^2 + \left(x_2 - p_{1,2}\right)^2} \\ \vdots \\ \sqrt{\left(x_1 - p_{m,1}\right)^2 + \left(x_2 - p_{m,2}\right)^2} \end{array} \right] \end{array} $

The best way to start is to create some example data for which you know the correct answer:
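For example, a point x at the origin and three points in P chosen so that the distances are easy to verify (these particular values are an assumption: the distances are 3, 4, and 3, summing to 10):

```julia
x = [0, 0]       # 2-D point as a 2-element (column) vector
P = [0  3;       # three 2-D points, one per row (m × 2 matrix)
     4  0;
     0 -3]
```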

In the figure, the sum of the distances from x to the three points in P is 10:

[Figure: the point x and the three points in P]

The first step is to transpose x: a 2-element array is interpreted as a column vector, and it needs to be a row vector so that it can be broadcast against P and subtracted from each row of P:
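A sketch of this step, continuing with the x and P defined above:

```julia
x' .- P       # 1×2 row vector broadcast against each row of the 3×2 matrix P
```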

Square each element of the result:
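Continuing the same expression:

```julia
(x' .- P) .^ 2        # square each element
```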

Add the elements in each row:
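Summing across each row (dims=2) gives an m × 1 result:

```julia
sum((x' .- P) .^ 2, dims=2)
```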

Then take the square root and assign the result to d:
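Putting the steps together (a sketch, continuing with the x and P from above):

```julia
d = sqrt.(sum((x' .- P) .^ 2, dims=2))    # element-wise square root of each row sum
```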

A function can be created and then called to assign the result to d:
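One possible definition (the name dist2 is given in the text; the body follows the steps above):

```julia
dist2(x, P) = sqrt.(sum((x' .- P) .^ 2, dims=2))   # distances from x to each row of P

d = dist2(x, P)
```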

As it is written, the function will work for points of any dimension, not just 2-D points. For n-dimensional points, x would be an n-element array and P an m × n matrix; e.g., for 4-D points:
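For example, with hypothetical 4-D data:

```julia
x4 = [1, 2, 3, 4]       # a 4-D point (hypothetical values)
P4 = [0 0 0 0;          # two 4-D points, one per row
      1 2 3 0]
dist2(x4, P4)           # ≈ [5.477, 4.0]
```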

The function can also be used for 1-D points; e.g., Ex 1 from NL Opt 1:
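A sketch with hypothetical 1-D values (x is a 1-element array and P an m × 1 matrix; the data from NL Opt 1 is not shown here):

```julia
x1 = [2]                        # a 1-D point (hypothetical value)
P1 = reshape([0, 5, 9], 3, 1)   # three 1-D points as a 3×1 matrix
dist2(x1, P1)                   # [2.0, 3.0, 7.0]
```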

To determine the number of elements in an array:
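For example, continuing with the example data:

```julia
length(x)      # number of elements in x (2)
```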

To determine the dimensions of an array:
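```julia
size(P)        # dimensions of P as a tuple, e.g., (3, 2)
```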

The function dist2 can now be used inside of any expression; e.g., to calculate the sum of the distances from x to the points in P:
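For example (10.0 for the example data above):

```julia
sum(dist2(x, P))    # total distance from x to the points in P
```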

Ex 2: Minimum-distance location

The function optimize performs general-purpose multivariate optimization. Instead of specifying a bounded range, as was done for univariate optimization with optimize, an initial location x0 is specified for multivariate optimization; starting from x0, the function determines the location x that minimizes the sum of distances to each point in P:
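A sketch using Optim's optimize (the starting location x0 is an assumption; with only a function and a starting point, optimize defaults to Nelder-Mead):

```julia
using Optim

x0 = [0.0, 0.0]                               # initial location (assumed)
res = optimize(xy -> sum(dist2(xy, P)), x0)   # Nelder-Mead by default
```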

To assign the optimal location and minimum total distance values to variables:
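For example (the variable names are assumptions; TC mirrors the TC* notation above):

```julia
xopt = Optim.minimizer(res)    # optimal location
TC   = Optim.minimum(res)      # minimum total distance
```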

To return only the optimal location:
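```julia
Optim.minimizer(optimize(xy -> sum(dist2(xy, P)), x0))
```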

Nelder-Mead Method

The Nelder-Mead method (1965) is the most widely used procedure for unconstrained multivariate optimization (more details on Julia's Optim package implementation of Nelder-Mead). It uses a simplex of d + 1 vertices (for a d-dimensional problem) to move towards an optimal solution. In 2-D, the simplex is a triangle and, as different simplexes are created through reflection, expansion, etc. (see figure, below), it looks like an amoeba moving; as a result, Nelder-Mead is sometimes referred to as the "amoeba method" (animation of Nelder-Mead).

[Figure: Nelder-Mead simplex operations (reflection, expansion, etc.)]

In order to be able to see the locations x at which dist2 is evaluated during a run of the Nelder-Mead method, dist2 can be wrapped inside of another function, call it f2plot, that plots each location visited:
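A possible sketch of such a wrapper, assuming the Plots package is used for the figure:

```julia
using Plots

scatter(P[:, 1], P[:, 2], label = "P")    # plot the fixed points once

function f2plot(x, P)
    scatter!([x[1]], [x[2]], label = false, markersize = 2)   # mark each location visited
    return sum(dist2(x, P))
end

res = optimize(xy -> f2plot(xy, P), x0, NelderMead())
```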

2. Gradient-based Optimization

Gradient-based algorithms require the gradient either to be provided as a function to optimize or to be approximated using finite differences. Some algorithms (e.g., Newton's method) also require the Hessian to be provided as a function.

Ex 3: Rosenbrock's Banana Function

Rosenbrock's banana function

$\quad f(x,y) = 100\left( y - x^2 \right)^2 + \left( 1 - x \right)^2$

is often used to illustrate numerical optimization methods because, although it is not difficult to determine the values for x and y that minimize the function using analytical procedures, many numerical procedures converge slowly to this solution.

The gradient of the function is

$\quad \nabla\!f(x,y) = \left[ \begin{array}{c} \dfrac{\partial f}{\partial x} \\ \dfrac{\partial f}{\partial y} \end{array} \right] = \left[ \begin{array}{c} 2x - 400x(y - x^2) - 2 \\ 200y - 200x^2 \end{array} \right] $

and its Hessian is

$\quad H\!f(x,y) = \left[ \begin{array}{cc} \dfrac{\partial^2 f}{\partial x^2} & \dfrac{\partial^2 f}{\partial x \partial y} \\ \dfrac{\partial^2 f}{\partial y \partial x} & \dfrac{\partial^2 f}{\partial y^2} \end{array} \right] = \left[ \begin{array}{cc} 1200x^2 - 400y + 2 & -400x \\ -400x & 200 \end{array} \right] $.

Solving $\partial f/\partial x = 0$ and $\partial f/\partial y = 0$ for $x$ and $y$ results in a single optimum of $[1, 1]$ with a value of $0$, which is a minimum since

$\quad \dfrac{\partial^2 f(1,1)}{\partial x^2} = 802 > 0$

and the determinant of the Hessian is positive,

$\quad \bigl| H\!f(1,1) \bigr| = \dfrac{\partial^2 f}{\partial x^2}(1,1) \dfrac{\partial^2 f}{\partial y^2}(1,1) - \left(\dfrac{\partial^2 f}{\partial x \partial y}(1,1) \right)^2 = 400 > 0$.
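A sketch of minimizing the banana function with Optim, supplying the gradient and Hessian derived above (the starting point x0 is an assumption; Optim expects in-place gradient and Hessian functions):

```julia
using Optim

f(x) = 100(x[2] - x[1]^2)^2 + (1 - x[1])^2

function g!(G, x)                 # gradient, written in-place as Optim expects
    G[1] = 2x[1] - 400x[1]*(x[2] - x[1]^2) - 2
    G[2] = 200x[2] - 200x[1]^2
end

function h!(H, x)                 # Hessian, in-place
    H[1,1] = 1200x[1]^2 - 400x[2] + 2
    H[1,2] = -400x[1]
    H[2,1] = -400x[1]
    H[2,2] = 200
end

x0 = [-1.2, 1.0]                  # a commonly used starting point (assumption)

optimize(f, g!, h!, x0, Newton()) # uses both the gradient and the Hessian
optimize(f, g!, x0, LBFGS())      # uses only the gradient
optimize(f, x0, NelderMead())     # gradient-free, for comparison
```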

Automatic differentiation (AD) evaluates the derivative using the function code. Julia has an active AD group. AD can be used to calculate the derivative for the optimization as long as the function is written only using Julia, without calls to non-Julia libraries.
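For example, Optim can compute the gradient by forward-mode AD instead of finite differences (a sketch, assuming the f and x0 defined above):

```julia
optimize(f, x0, LBFGS(); autodiff = :forward)   # gradient supplied by ForwardDiff
```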

Ex 4: Cantilever Beam Design

Determining the maximum deflection $x_1$ and rotation $x_2$ at the tip of a cantilever beam can be formulated as a minimization of the potential energy of the beam, which reduces to the unconstrained minimization of

$ \quad f(x_1,x_2) = 12x_1^2 + 4x_2^2 - 12x_1x_2 + 2x_1 $,

which has a known solution of $(-1/3, -1/2)$. See N.H. Kim, p. 129, for more details.
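A sketch of minimizing the beam's potential-energy function with Optim (the starting point and the use of L-BFGS with forward-mode AD are assumptions):

```julia
using Optim

fbeam(x) = 12x[1]^2 + 4x[2]^2 - 12x[1]*x[2] + 2x[1]

res = optimize(fbeam, [0.0, 0.0], LBFGS(); autodiff = :forward)
Optim.minimizer(res)     # ≈ [-0.3333, -0.5], i.e., (-1/3, -1/2)
```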

3. Regression

Regression is a method of modeling the relationship between a dependent variable and one or more independent variables. The model is expressed as a function that "best fits" the independent variables to the dependent variable. Determining the best fit involves solving a multivariate optimization problem, where the Nelder-Mead procedure can be used to determine the coefficients. If the coefficients of the model are linear in the function, then the method is termed linear regression. Different objective functions (termed loss functions) can be used to fit the model.

Ex 5: Dose-Response Relationship of a Medication

A new medication is being developed. Different doses of the medication have been given to thirteen subjects, and the resulting responses were recorded. Determine the dose-response relationship.

Solution: It is always a good idea to first plot the data to see what the relationship might be between the independent dose variable, x, and the dependent response variable, y:
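A sketch of the plot, using the dose-response values listed in the CSV file at the end of this notebook:

```julia
using Plots

x = [121, 143, 63, 80, 198, 52, 160, 162, 85, 106, 129, 141, 106]    # dose
y = [237, 214, 161, 146, 331, 159, 423, 332, 139, 327, 152, 98, 116] # response

scatter(x, y, xlabel = "Dose", ylabel = "Response", legend = false)
```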

Based on the plot, there seems to be some correlation between dose and response:
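For example, the sample correlation coefficient (assuming the Statistics standard library):

```julia
using Statistics

cor(x, y)    # sample correlation between dose and response
```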

With some correlation indicated, we will next use a linear model to represent the relationship. The model can then be used to predict what the response would be, $\hat{y}$, for any dose $x$:

$\quad \hat{y} = \alpha_1 + \alpha_2 x$.

The model will be fit by determining the values for the intercept $\alpha_1$ and slope $\alpha_2$ that minimize the sum of the squared distance between the predicted $\hat{y}$ and actual $y$ responses given the dose $x$ for the thirteen dose-response pairs of data:

$\quad \textrm{L2 loss: } \sum (\hat{y} - y)^2$
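A sketch of fitting the model by minimizing the L2 loss with Nelder-Mead (the model function name and the starting coefficient values are assumptions; x and y are the dose and response vectors above):

```julia
using Optim

yhat(a, x) = a[1] .+ a[2] .* x                      # linear model: intercept + slope
L2(a) = sum((yhat(a, x) .- y) .^ 2)                 # sum of squared deviations

a2 = Optim.minimizer(optimize(L2, [0.0, 1.0]))      # Nelder-Mead by default
```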

Why is the L2 loss function being used? Might it be better to try to minimize the sum of the absolute deviations instead of the square of the deviations?

$\quad \textrm{L1 loss: } \sum \bigl| \hat{y} - y \bigr|$
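The same fit using the L1 loss, for comparison (a sketch, assuming the yhat, x, and y defined above):

```julia
L1(a) = sum(abs.(yhat(a, x) .- y))                  # sum of absolute deviations

a1 = Optim.minimizer(optimize(L1, [0.0, 1.0]))
```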

MSE vs. MAD

L2 loss is the only loss function for which minimizing the loss (minimum squared error, MSE) yields the mean of the data; most importantly, any change in the data is reflected in a change to the mean, and so the mean allows full information recovery. Minimizing the L1 loss (minimum absolute deviation, MAD) corresponds to the median of the data and does not allow full information recovery, which in some cases is a good feature because it makes the estimate more robust with respect to outliers.

[Figure: MSE vs. MAD]

4. DataFrames

The DataFrames package can be used to work with structured tabular (i.e., row-column) data. To create a single-row table:
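For example (the column names and values are assumptions based on the dose-response data):

```julia
using DataFrames

df = DataFrame(Dose = 121, Response = 237)
```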

To add a row to the table:
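```julia
push!(df, (143, 214))      # append a row as a tuple
```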

To create a two-row table:
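```julia
df2 = DataFrame(Dose = [121, 143], Response = [237, 214])
```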

To access portions of a table:
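A few common forms (a sketch, using the df2 table above):

```julia
df2.Dose            # a column, by name
df2[1, :]           # the first row
df2[1, :Response]   # a single element
df2[1:2, [:Dose]]   # a sub-table of rows 1–2 and the Dose column
```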

Reading Data from a CSV File

Typically, large tabular datasets are available in CSV (comma-separated values) format. As an example, the Dose-Response example data is available in the CSV file _NLOpt-2-Data.csv, listed below (reading it into a DataFrame is sketched after the listing):

Dose,Response
121,237
143,214
63,161
80,146
198,331
52,159
160,423
162,332
85,139
106,327
129,152
141,98
106,116
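A sketch of reading the file into a DataFrame (assuming the file is in the working directory):

```julia
using CSV, DataFrames

df = CSV.read("_NLOpt-2-Data.csv", DataFrame)
x, y = df.Dose, df.Response       # dose and response as vectors
```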