# Dual numbers, invented by Clifford in 1873.  \bbiD

"""
    ⅅ(a, b)

Dual number `a + b·ε` with `ε² = 0`, stored as two `Float64` fields.

When a function is evaluated on `ⅅ(x, 1)`, the arithmetic rules below carry
the function value in field `a` and the first derivative in field `b`
(forward-mode automatic differentiation).
"""
struct ⅅ <: Number
    a::Float64    # value part
    b::Float64    # derivative (ε) part
end


import Base: +,-,*,/

# Binary arithmetic: sum, difference, product and quotient rule.
Base.:+(z1::ⅅ, z2::ⅅ) = ⅅ(z1.a + z2.a, z1.b + z2.b)
Base.:-(z1::ⅅ, z2::ⅅ) = ⅅ(z1.a - z2.a, z1.b - z2.b)
Base.:*(z1::ⅅ, z2::ⅅ) = ⅅ(z1.a * z2.a, z1.a * z2.b + z1.b * z2.a)
Base.:/(z1::ⅅ, z2::ⅅ) = ⅅ(z1.a / z2.a, (z2.a * z1.b - z1.a * z2.b)/z2.a^2)

# Unary minus, so that expressions such as `-x^2 + 2` can be evaluated on a ⅅ.
Base.:-(z::ⅅ) = ⅅ(-z.a, -z.b)


# Rules for elementary functions (a small selection): chain rule applied to
# the derivative part.
import Base: sin, log
Base.sin(z::ⅅ) = ⅅ(sin(z.a), cos(z.a) * z.b)
Base.log(z::ⅅ) = ⅅ(log(z.a), 1/z.a * z.b)

# A real number becomes a dual number with zero derivative part. Promotion is
# declared for exactly the types `convert` accepts, so that mixed expressions
# like `2x + 1` are lifted to ⅅ automatically.
Base.convert(::Type{ⅅ}, x::Real) = ⅅ(x, zero(x))
Base.promote_rule(::Type{ⅅ}, ::Type{<:Real}) = ⅅ


# The derivative operator: computes the value f'(x) at the point x

"""
    ∂(f, x)

Evaluate `f` on the dual number `ⅅ(x, 1)` and return the `b` field of the
result, i.e. the derivative part produced by the dual-number arithmetic.
"""
function ∂(f, x)
    seeded = ⅅ(x, 1)
    return f(seeded).b
end

∂ (generic function with 1 method)


# For testing

"""
    f(x)

One-dimensional test function `4x^2 + 2x + 5sin(3x)`.
"""
function f(x)
    quadratic = 4 * x^2
    linear = 2 * x
    oscillation = 5 * sin(3 * x)
    return quadratic + linear + oscillation
end

# Derivative
"""
    fp(x)

Hand-written derivative `8x + 2 + 15cos(3x)` of the test function `f(x)`.
"""
function fp(x)
    return 8 * x + 2 + 15 * cos(3 * x)
end

fp (generic function with 1 method)


# Compare f evaluated on the dual number ⅅ(5,1) (value and derivative part)
# with the plain value f(5) and the hand-written derivative fp(5).
@show f(ⅅ(5,1))  f(5) fp(5);

f(ⅅ(5, 1)) = ⅅ(113.25143920078558, 30.60468130711768)
f(5) = 113.25143920078558
fp(5) = 30.60468130711768


# Derivative of f at x = 5, obtained through the ∂ operator
∂(f,5)

30.60468130711768


# Implementation of the one-dimensional Newton method;
# f' is computed through the arithmetic of dual numbers


"""
    Newton1(fct, x0; MaxIter = 50, Eps = 1.e-14)

Newton iteration for a root of `fct`, started at `x0`.

In every step `fct` is evaluated on `ⅅ(x, 1)`; the `a` field of the result is
used as the function value and the `b` field as the derivative. Each step
prints the iteration number and the new iterate.

Returns the new iterate as soon as it differs from the previous one by less
than `Eps`. If more than `MaxIter` steps would be needed, a message is written
to `stderr` and `nothing` is returned.
"""
function Newton1(fct, x0; MaxIter = 50, Eps = 1.e-14)
    x = x0
    for k in Iterators.countfrom(1)
        if k > MaxIter
            println(stderr, "Max number of iterations reached without convergence, stop")
            return
        end

        # One dual-number evaluation yields both f(x) and f'(x).
        dual = fct(ⅅ(x, 1))
        xnext = x - dual.a / dual.b
        println(k, " ", xnext)

        abs(xnext - x) < Eps && return xnext
        x = xnext
    end
end

Newton1 (generic function with 1 method)


# Root of 2 - x^2, started at x0 = 1
Newton1(x-> 2-x^2, 1)

1 1.5
2 1.4166666666666667
3 1.4142156862745099
4 1.4142135623746899
5 1.4142135623730951
6 1.414213562373095

1.414213562373095


x = Newton1(x->2-x^3, 2)    # cube root of 2

1 1.5
2 1.2962962962962963
3 1.2609322247417485
4 1.2599218605659261
5 1.2599210498953948
6 1.2599210498948732
7 1.2599210498948732

1.2599210498948732

# Check: cube the root returned by Newton1 for 2 - x^3
x^3

2.0


using ForwardDiff, # hessian, gradient
    LinearAlgebra, # norm of arrays
    Plots


"""
    NewtonOpti(F, x0vec; MaxIter = 50, Eps = 1.e-14)

Multidimensional extremum search with Newton's method.

# Arguments
- `F`: function of an n-vector
- `x0vec`: n-vector of start values
- `MaxIter`: maximum number of iterations
- `Eps`: the iteration stops once the norm of the Newton step,
  `||x_new - x_old||`, is below `Eps`

Each step solves the linear system formed by `ForwardDiff.hessian(F, x)` and
`ForwardDiff.gradient(F, x)` and prints the new iterate.

# Returns
For later visualisation the iterates are returned as a matrix with one
iterate per column: the start vector first, followed by one column per
iteration step. If more than `MaxIter` steps would be needed, a message is
written to `stderr` and `nothing` is returned.
"""
function NewtonOpti(F, x0vec; MaxIter = 50, Eps = 1.e-14)
    path = copy(x0vec)      # grows by one column per iteration
    current = x0vec
    for i in Iterators.countfrom(1)
        if i > MaxIter
            println(stderr, "Max number of iterations reached without convergence, stop.")
            return
        end

        hess = ForwardDiff.hessian(F, current)
        newtonstep = hess \ ForwardDiff.gradient(F, current)
        next = current - newtonstep

        path = [path next]
        println(next)

        if norm(newtonstep) < Eps
            println("Extremum reached after $i iterations at $next")
            return path
        end
        current = next
    end
end

NewtonOpti


# our two-dimensional test function

"""
    f(x, y)

Two-dimensional test function: the polynomial `1 - x/2 + x^5 + y^3`
multiplied by `exp(-x^2 - y^2)`.
"""
function f(x, y)
    polynomial = 1.0 - x / 2 + x^5 + y^3
    damping = exp(-x^2 - y^2)
    return polynomial * damping
end

# and now with a vector argument, as required by ForwardDiff
# and therefore by NewtonOpti():

"""
    F(xvec)

Vector-argument wrapper around `f(x, y)`: passes the first two entries of
`xvec` as `x` and `y`.
"""
F(xvec) = f(xvec[1], xvec[2])

F (generic function with 1 method)


# this is what the test function looks like (surface plot over [-3,3] x [-3,3]):


surface( -3:0.02:3, -3:0.02:3,  f)


# the contour plot shows the minima and maxima

contour( -3:0.02:3, -3:0.02:3,  f, fill=true, c=:Blues, levels=20, contour_labels=false)


# and off we go: run the Newton search from the start vector [2, 0.1]

xs = NewtonOpti(F, [2.,0.1])

[0.1332054959300537, -0.290375646177925]
[-0.5092885621074995, 0.08142783320806135]
[-0.24479556529773994, -0.03277048936762038]
[-0.22026161325055604, -0.0011927350354439467]
[-0.22004307520481325, -1.91323696826411e-6]
[-0.22004305442098376, -4.94875303235653e-12]
[-0.2200430544209836, -3.310822713486171e-23]
[-0.22004305442098357, 0.0]
Extremum reached after 8 iterations at [-0.22004305442098357, 0.0]

2×9 Matrix{Float64}:
 2.0   0.133205  -0.509289   -0.244796   …  -0.220043     -0.220043
 0.1  -0.290376   0.0814278  -0.0327705     -3.31082e-23   0.0


# ... we draw the steps of the Newton method towards the
# maximum that was found into the plot:

plot!(xs[1,:], xs[2,:], marker=:circle, markersize=5)


# we combine computation and visualisation right away
# and add the option
# to plot sections with the bounds [(x1,x2),(y1,y2)]

"""
    MakePlot(x0; x1=-3, x2=3, y1=-3, y2=3)

Run `NewtonOpti(F, x0)` and draw the iterates on top of a filled contour plot
of `f` over the window `[x1, x2] × [y1, y2]`, sampled on a 300 × 300 grid.

`F` and `f` are the file-level test functions. Returns the plot. If
`NewtonOpti` returns `nothing` (no convergence), only the contour plot is
returned, without an iteration path.
"""
function MakePlot(x0; x1=-3, x2=3, y1=-3, y2=3)
    xs = NewtonOpti(F, x0)
    p = contour(range(x1, x2; length=300), range(y1, y2; length=300), f;
        fill=true, c=:Blues, levels=20, contour_labels=false)

    # NewtonOpti yields `nothing` when it gives up; there is no path to draw then.
    xs === nothing && return p

    # `linewidth` is the Plots attribute for line thickness.
    return plot!(p, xs[1, :], xs[2, :]; marker=:circle, markersize=5, linewidth=2)
end

MakePlot (generic function with 1 method)


# and the picture from above once more, zoomed in
# ... interestingly, the first iteration step overshoots the nearest
# maximum and the method runs to the other maximum...


MakePlot([2,.1], x1=-1.3, x2=2.5, y1=-.5, y2=.3)

[0.1332054959300537, -0.290375646177925]
[-0.5092885621074995, 0.08142783320806135]
[-0.24479556529773994, -0.03277048936762038]
[-0.22026161325055604, -0.0011927350354439467]
[-0.22004307520481325, -1.91323696826411e-6]
[-0.22004305442098376, -4.94875303235653e-12]
[-0.2200430544209836, -3.310822713486171e-23]
[-0.22004305442098357, 0.0]
Extremum reached after 8 iterations at [-0.22004305442098357, 0.0]


# start vector [1, 0.1], plotted over the default window
MakePlot([1,0.1])

[0.6956106547605012, 0.03171439130151904]
[0.7920383277477394, -0.0004734597583571504]
[0.7890525789862474, -3.9117647761667627e-7]
[0.7890542734775248, -2.518659773261041e-13]
[0.7890542734780247, -1.044578056257455e-25]
[0.7890542734780247, 0.0]
Extremum reached after 6 iterations at [0.7890542734780247, 0.0]


# ...and this time we hit the saddle point.
# all partial derivatives vanish there as well, of course

MakePlot([1,0.1], x1=0.5, x2=1.2, y1=-.2, y2=.2)

[0.6956106547605012, 0.03171439130151904]
[0.7920383277477394, -0.0004734597583571504]
[0.7890525789862474, -3.9117647761667627e-7]
[0.7890542734775248, -2.518659773261041e-13]
[0.7890542734780247, -1.044578056257455e-25]
[0.7890542734780247, 0.0]
Extremum reached after 6 iterations at [0.7890542734780247, 0.0]


# with this start value the iteration goes to one of the minima

MakePlot( [-1.8,0.2])

[-1.6584806215974253, -0.03160877603265452]
[-1.6881945075073073, 0.0003759256128861993]
[-1.6888385202356129, 1.696332552631732e-8]
[-1.688838885976237, 3.627747814500337e-17]
[-1.6888388859763552, 0.0]
[-1.6888388859763555, 0.0]
Extremum reached after 6 iterations at [-1.6888388859763555, 0.0]


# once more, zoomed in

MakePlot([-1.8,.2], x1=-2, x2=-1.4, y1=-.4, y2=.3)

[-1.6584806215974253, -0.03160877603265452]
[-1.6881945075073073, 0.0003759256128861993]
[-1.6888385202356129, 1.696332552631732e-8]
[-1.688838885976237, 3.627747814500337e-17]
[-1.6888388859763552, 0.0]
[-1.6888388859763555, 0.0]
Extremum reached after 6 iterations at [-1.6888388859763555, 0.0]


# and with this start value we also reach the right-hand maximum

MakePlot([1.3,0.2])

[1.7495598911691388, -0.1481347995568894]
[1.4979885189593156, 0.03284641414014772]
[1.5486102113661622, -0.0006009360354399529]
[1.5477195717036256, -5.706673652540722e-8]
[1.5477195171353288, -5.36382925634516e-16]
[1.5477195171353284, -9.860761315262648e-32]
Extremum reached after 6 iterations at [1.5477195171353284, -9.860761315262648e-32]


# once more, zoomed in

MakePlot([1.3,.2], x1=1.1, x2=2, y1=-.2, y2=.3)

[1.7495598911691388, -0.1481347995568894]
[1.4979885189593156, 0.03284641414014772]
[1.5486102113661622, -0.0006009360354399529]
[1.5477195717036256, -5.706673652540722e-8]
[1.5477195171353288, -5.36382925634516e-16]
[1.5477195171353284, -9.860761315262648e-32]
Extremum reached after 6 iterations at [1.5477195171353284, -9.860761315262648e-32]

Newton-Verfahren und automatische Differentiation

Banachscher Fixpunktsatz

Newton-Verfahren zur Nullstellensuche einer Funktion $f(x)$

Newton-Verfahren zur Nullstellensuche eines nichtlinearen Gleichungssystems

Automatisches Differenzieren

Duale Zahlen

Newton-Verfahren in der Optimierung

Das Paket ForwardDiff.jl