add test for Gauss-Newton

inverseproblem · inverseproblem · commit 4710daa102bc · 2025-03-05T10:40:41.000+01:00
diff --git a/.github/workflows/documentation.yml b/.github/workflows/documentation.yml
@@ -1,14 +1,18 @@
-name: Documentation
+name: Build documentation
 
 on:
   push:
     branches:
       - main # update to match your development branch (master, main, dev, trunk, ...)
-    tags: '*'
+      - develop
+    tags:
+      - 'v*'
   pull_request:
+    branches:
+      - develop
 
 jobs:
-  build:
+  build_docs:
     permissions:
       actions: write
       contents: write
@@ -20,7 +24,9 @@ jobs:
       - uses: julia-actions/setup-julia@v2
         with:
           version: '1'
-      - uses: julia-actions/cache@v2  # reduce GitHub Actions running time
+      - name: Julia cache
+        if: ${{ !env.ACT }}
+        uses: julia-actions/cache@v2
       - name: Install dependencies
         run: julia --project=docs/ -e 'using Pkg; Pkg.develop(PackageSpec(path=pwd())); Pkg.instantiate()'
       - name: Build docs and deploy
diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
@@ -0,0 +1,48 @@
+name: Package tests
+
+on:
+  push:
+    branches:
+      - main
+      - develop
+    tags: '*'
+  pull_request:
+    branches:
+      - develop
+    # `types` replaces the default activity types, so opened/reopened are listed
+    # explicitly; otherwise a PR opened as ready would not run until its next push.
+    types: [opened, reopened, ready_for_review, synchronize]
+
+# needed to allow julia-actions/cache to delete old caches that it has created
+permissions:
+  actions: write
+  contents: read
+
+jobs:
+  run_tests:
+    name: Julia ${{ matrix.julia-version }} - ${{ matrix.os }} - ${{ matrix.arch }}
+    runs-on: ${{ matrix.os }}
+    if: github.event.pull_request.draft == false
+    strategy:
+      matrix:
+        julia-version: ['1'] #['lts', '1', 'pre']
+        arch: [x64] #[x64, x86]
+        os: [ubuntu-latest, macOS-latest] #[ubuntu-latest, windows-latest, macOS-latest]
+        include:
+          - os: macOS-latest
+            julia-version: '1'
+            arch: aarch64
+
+    steps:
+      - uses: actions/checkout@v4
+      - uses: julia-actions/setup-julia@v2
+        with:
+          version: ${{ matrix.julia-version }}
+          arch: ${{ matrix.arch }}
+      - name: Julia cache
+        if: ${{ !env.ACT }}
+        uses: julia-actions/cache@v2
+      - uses: julia-actions/julia-buildpkg@v1
+      - uses: julia-actions/julia-runtest@v1
+        # with:
+        #   annotate: true
diff --git a/src/Optimizers/GaussNewton/gauss_newton.jl b/src/Optimizers/GaussNewton/gauss_newton.jl
@@ -57,6 +57,8 @@ function gaussnewton(calcfwd!::Function,
     end
     @assert length(xprior)==length(x0)
 
+    @info "\n*** Gauss-Newton optimization  *** "
+
     ## init
     N = size(invCd,1)
     M = length(x0)
@@ -92,8 +94,8 @@ function gaussnewton(calcfwd!::Function,
         res_m .= xcur - xprior
         objval += 0.5 * dot(res_m,invCm,res_m)
         ##=======================
-        #    Gradient
-        # Jtres = J*res, i.e., the gradient
+        #   Gradient
+        #  grad = J^T * Cd^-1 * res_d + Cm^-1 * res_m
         mul!(tmpgr_d,invCd,res_d)
         mul!(grad,transpose(jac),tmpgr_d)
         mul!(tmpgr_m,invCm,res_m)
@@ -116,14 +118,15 @@ function gaussnewton(calcfwd!::Function,
     #   and get the in-place jacobian as an optional argument
     misf[1] = fh!(grad,x[1])
     g0norm = norm(grad)
-    
+
+    @info "Initial misfit $(misf[1])     "
     ## Loop
     for k=1:maxiter
      
         ##===============================
         # Jacobian
         calcjac!(jac,x[k])
-        # Now (J^T*invCd*J + invCm) p_gn = - (J^T*invCm) *res
+        # Now (J^T*invCd*J + invCm) p_gn = -grad = -(J^T*invCd*res_d + invCm*res_m)
         # invCd * J
         mul!(invCd_J,invCd,jac)
         # temporary store invCm in the Hessian array
@@ -132,13 +135,15 @@ function gaussnewton(calcfwd!::Function,
         #  J^T * invCd * J + invCm
         mul!(H,transpose(jac),invCd_J,1.0,1.0)
         # solve linear system
-        faJtJ = factorize(Symmetric(H))
-        # J^t*J*p_gn = -J^t*res
-        #  pkgn is the descent direction
+        #faJtJ = factorize(Symmetric(H)) # this seems to get singular...
+        faJtJ = lu(H) 
+        ## (J^T*invCd*J + invCm) p_gn = -grad = -(J^T*invCd*res_d + invCm*res_m)
+        ##  pkgn is the descent direction
         ldiv!(pkgn,faJtJ,-grad)
+        ##===============================
 
         ##===============================
-        # Line search
+        ## Line search
         if k==1
             α0 = target_update
         else
@@ -150,10 +155,10 @@ function gaussnewton(calcfwd!::Function,
                                                α0=α0,maxiterwolfe=maxiterwolfe,
                                                maxiterzoom=maxiterzoom,
                                                c1=c1,c2=c2)
-
-        ##===============================
         # Update the solution
-        x[k+1] .= x0αp #x[k] .+ α.*pkgn
+        x[k+1] .= x0αp   ###x[k] .+ α.*pkgn
+        ##===============================
+
 
         if bounds!=nothing
             # project x[k+1]
diff --git a/test/runtests.jl b/test/runtests.jl
@@ -27,17 +27,29 @@ with_logger(logger) do
         @test test_bfgs2()
 
     end
+
+    @testset "Test Gauss-Newton algo" begin
+
+        printstyled("Gauss-Newton: Test 1\n", bold=true,color=:cyan)
+        @test test_gaussnewton1()
+        
+        printstyled("Gauss-Newton: Test 2\n", bold=true,color=:cyan)
+        @test test_gaussnewton2()
+
+        printstyled("Gauss-Newton: Test 3\n", bold=true,color=:cyan)
+        @test test_gaussnewton3()
+    end
 end
 
 
 # KronLinInv
 @testset "Test KronLinInv" begin
 
     printstyled("KronLinInv: Testing 2D example \n", bold=true,color=:cyan)
-    @test test2D()
+    @test test_KLI2D()
 
     printstyled("KronLinInv: Testing 3D example \n", bold=true,color=:cyan)
-    @test test3D()
+    @test test_KLI3D()
 
     println()
 end
diff --git a/test/test_gaussnewton.jl b/test/test_gaussnewton.jl
@@ -0,0 +1,148 @@
+
+
+using LinearAlgebra
+## using GLMakie
+
+
+# Gauss-Newton on the `styblinskitang` test function: the only datum is the
+# function value at its known minimum, and the run must end near the minimizer.
+function test_gaussnewton1()
+    tval = -2.903534
+    tvec = [tval,tval] # location of the minimum
+    stmin = -39.16617*length(tvec) # value at the minimum
+
+    # forward model: a single datum, the function value at x
+    function calcfwd!(u,x)
+        u .= styblinskitang(x)
+        return nothing
+    end
+
+    # Jacobian: its only row is `∇styblinskitang(x)`
+    function calcjac!(g,x)
+        g[1,:] .= ∇styblinskitang(x)
+        return nothing
+    end
+
+    xprior = [-0.5,-4.5]
+    obsdata = [stmin]
+    invCd = [1.0;;]
+    # NOTE(review): with one datum and invCm = 0, J^T*invCd*J + invCm has rank 1
+    # for two unknowns -- confirm the linear solve in `gaussnewton` tolerates this.
+    invCm = zeros(2,2)
+    maxiter = 30
+
+    xout,misfout = gaussnewton(calcfwd!,calcjac!,
+                               obsdata=obsdata,
+                               invCd=invCd,
+                               invCm=invCm,
+                               xprior=xprior,
+                               maxiter=maxiter)
+    return isapprox(xout[end],tvec,rtol=1e-2)
+end
+
+# Recover (a,b) of y = a*x/(b+x) from 25 noise-free samples with Gauss-Newton.
+function test_gaussnewton2()
+    # forward model, evaluated element-wise on the abscissas x
+    function fwd(a::Real,b::Real,x::Vector{Float64})
+        return a.*x./(b.+x)
+    end
+
+    # Synthetic data. `x` is assigned before the closures below are created, so
+    # they do not capture a variable that is still unassigned at that point.
+    a,b = 2,3
+    x = collect(range(0,5,length=25))
+    obsdata = fwd(a,b,x)
+
+    function calcfwd!(u,m)
+        u .= fwd(m[1],m[2],x)
+        return nothing
+    end
+
+    # Jacobian columns: d/da = x/(b+x),  d/db = -a*x/(b+x)^2
+    function calcjac!(jac,m)
+        aj = m[1]
+        bj = m[2]
+        grad_a = x ./ (bj.+x)
+        grad_b = - ((aj.*x) ./ ((bj .+ x).^2))
+        jac .= [grad_a grad_b]
+        return nothing
+    end
+
+    ab0 = [1.0,5.0]
+    xprior = copy(ab0)
+    invCd = diagm(ones(length(obsdata)))
+    invCm = zeros(length(ab0),length(ab0))
+    maxiter = 30
+
+    xout,misfout = gaussnewton(calcfwd!,calcjac!,
+                               obsdata=obsdata,
+                               invCd=invCd,invCm=invCm,
+                               xprior=xprior,maxiter=maxiter,
+                               target_update=3.0)
+
+    # default `≈` tolerance: the fit must reproduce (a,b) essentially exactly
+    return xout[end] ≈ [a,b]
+end
+    
+
+# Drive the scalar forward model f(x) = sum(x.^2) towards the observed value 0
+# with Gauss-Newton; passes when the last iterate is within 0.1 of the origin.
+function test_gaussnewton3()
+    # forward model: a single datum, the squared norm of x
+    function calcfwd!(u,x)
+        fill!(u, sum(abs2, x))
+        return nothing
+    end
+
+    # Jacobian: its only row is the gradient 2x
+    function calcjac!(J,x)
+        J[1,:] .= 2 .* x
+        return nothing
+    end
+
+    xprior = [10.0,-13.5]
+    obsdata = [0.0]
+    invCd = ones(1,1)
+    invCm = zeros(2,2)
+    maxiter = 50
+
+    xout,misfout = gaussnewton(calcfwd!,calcjac!,
+                               obsdata=obsdata,
+                               invCd=invCd,
+                               invCm=invCm,
+                               xprior=xprior,
+                               maxiter=maxiter)
+
+    # Disabled cross-check, kept for reference: minimize the same objective with
+    # `lmbfgs` and print both final iterates.
+    #
+    # N = size(invCd,1)
+    # M = length(xprior)
+    # u_calc = zeros(eltype(xprior),N)
+    # grad = zeros(eltype(xprior),M)
+    # jac = zeros(eltype(xprior),N,M)
+    #
+    # function fh_bfgs!(grad,xcur)
+    #     calcfwd!(u_calc,xcur)   # calculated data
+    #     calcjac!(jac,xcur)      # Jacobian
+    #     # objective = data misfit + prior term
+    #     res_d = u_calc - obsdata
+    #     objval = 0.5 * dot(res_d,invCd,res_d)
+    #     res_m = xcur - xprior
+    #     objval += 0.5 * dot(res_m,invCm,res_m)
+    #     grad .= transpose(jac) * invCd * res_d + invCm * res_m
+    #     return objval
+    # end
+    #
+    # xout_bfgs,misfout_bfgs = lmbfgs(fh_bfgs!,
+    #                                 xprior,
+    #                                 mem=20,
+    #                                 maxiter=maxiter)
+    # @show xout[end]
+    # @show xout_bfgs[end]
+
+    # absolute tolerance, since the target is the zero vector
+    origin = [0.0,0.0]
+    converged = isapprox(xout[end],origin,atol=1e-1)
+    return converged
+end
diff --git a/test/test_kronlininv.jl b/test/test_kronlininv.jl
@@ -3,7 +3,7 @@
 
 ###############################################
 
-function test2D( )
+function test_KLI2D( )
 
     ## 2D problem, so set nx = 1
     nx = 1
@@ -26,7 +26,7 @@ end
 
 #########################################
 
-function test3D( )
+function test_KLI3D( )
 
     ## 2D problem, so set nx = 1
     nx = 8