path way to 3D variational stokes

PTsolvers · Nov 29, 2024 · dc88598 · dc88598
1 parent f1f3d2c
commit dc88598
Show file tree

Hide file tree

Showing 7 changed files with 835 additions and 54 deletions.
diff --git a/src/stress_rotation/stress_rotation_particles.jl b/src/stress_rotation/stress_rotation_particles.jl
@@ -3,8 +3,8 @@ using StaticArrays
 # Vorticity tensor
 
 @parallel_indices (I...) function compute_vorticity!(ωxy, Vx, Vy, _dx, _dy)
-    @inline dx(A) = _d_xa(A, I..., _dx)
-    @inline dy(A) = _d_ya(A, I..., _dy)
+    @inline dx(A) = _d_xa(A, _dx, I...)
+    @inline dy(A) = _d_ya(A, _dy, I...)
 
     ωxy[I...] = 0.5 * (dx(Vy) - dy(Vx))
 
@@ -14,9 +14,9 @@ end
 @parallel_indices (I...) function compute_vorticity!(
     ωyz, ωxz, ωxy, Vx, Vy, Vz, _dx, _dy, _dz
 )
-    dx(A) = _d_xa(A, I..., _dx)
-    dy(A) = _d_ya(A, I..., _dy)
-    dz(A) = _d_za(A, I..., _dz)
+    dx(A) = _d_xa(A, _dx, I...)
+    dy(A) = _d_ya(A, _dy, I...)
+    dz(A) = _d_za(A, _dz, I...)
 
     if all(I .≤ size(ωyz))
         ωyz[I...] = 0.5 * (dy(Vz) - dz(Vy))

diff --git a/src/variational_stokes/MiniKernels.jl b/src/variational_stokes/MiniKernels.jl
@@ -10,29 +10,66 @@ end
 # finite differences
 Base.@propagate_inbounds @inline _d_xa(A::T, ϕ::T, _dx, I::Vararg{Integer,N}) where {N,T} =
     (-center(A, ϕ, I...) + right(A, ϕ, I...)) * _dx
+
 Base.@propagate_inbounds @inline _d_ya(A::T, ϕ::T, _dy, I::Vararg{Integer,N}) where {N,T} =
     (-center(A, ϕ, I...) + front(A, ϕ, I...)) * _dy
+
 Base.@propagate_inbounds @inline _d_za(A::T, ϕ::T, _dz, I::Vararg{Integer,N}) where {N,T} =
     (-center(A, ϕ, I...) + front(A, ϕ, I...)) * _dz
+
 Base.@propagate_inbounds @inline _d_xi(A::T, ϕ::T, _dx, I::Vararg{Integer,N}) where {N,T} =
     (-front(A, ϕ, I...) + next(A, ϕ, I...)) * _dx
+
 Base.@propagate_inbounds @inline _d_yi(A::T, ϕ::T, _dy, I::Vararg{Integer,N}) where {N,T} =
     (-right(A, ϕ, I...) + next(A, ϕ, I...)) * _dy
 
-# averages
+Base.@propagate_inbounds @inline _d_zi(A::T, ϕ::T, _dz, I::Vararg{Integer,N}) where {N,T} =
+    (-top(A, ϕ, I...) + next(A, ϕ, I...)) * _dz
+
+# averages 2D
 Base.@propagate_inbounds @inline _av(A::T, ϕ::T, i, j) where {T<:T2} =
     0.25 * mysum(A, ϕ, (i + 1):(i + 2), (j + 1):(j + 2))
+
 Base.@propagate_inbounds @inline _av_a(A::T, ϕ::T, i, j) where {T<:T2} =
     0.25 * mysum(A, ϕ, (i):(i + 1), (j):(j + 1))
+
 Base.@propagate_inbounds @inline _av_xa(A::T, ϕ::T, I::Vararg{Integer,2}) where {T<:T2} =
     (center(A, ϕ, I...) + right(A, ϕ, I...)) * 0.5
+
 Base.@propagate_inbounds @inline _av_ya(A::T, ϕ::T, I::Vararg{Integer,2}) where {T<:T2} =
     (center(A, ϕ, I...) + front(A, ϕ, I...)) * 0.5
+
 Base.@propagate_inbounds @inline _av_xi(A::T, ϕ::T, I::Vararg{Integer,2}) where {T<:T2} =
     (front(A, ϕ, I...), next(A, ϕ, I...)) * 0.5
+
 Base.@propagate_inbounds @inline _av_yi(A::T, ϕ::T, I::Vararg{Integer,2}) where {T<:T2} =
     (right(A, ϕ, I...), next(A, ϕ, I...)) * 0.5
 
+# averages 3D
+Base.@propagate_inbounds @inline _av(A::T, ϕ::T, i, j, k) where {T<:T3} =
+    0.125 * mysum(A, ϕ, (i + 1):(i + 2), (j + 1):(j + 2), (k + 1):(k + 2))
+
+Base.@propagate_inbounds @inline _av_a(A::T, ϕ::T, i, j, k) where {T<:T3} =
+    0.125 * mysum(A, ϕ, (i):(i + 1), (j):(j + 1), (k):(k + 1))
+
+Base.@propagate_inbounds @inline _av_xa(A::T, ϕ::T, I::Vararg{Integer,3}) where {T<:T3} =
+    (center(A, ϕ, I...) + right(A, ϕ, I...)) * 0.5
+
+Base.@propagate_inbounds @inline _av_ya(A::T, ϕ::T, I::Vararg{Integer,3}) where {T<:T3} =
+    (center(A, ϕ, I...) + front(A, ϕ, I...)) * 0.5
+
+Base.@propagate_inbounds @inline _av_za(A::T, ϕ::T, I::Vararg{Integer,3}) where {T<:T3} =
+    (center(A, ϕ, I...) + top(A, ϕ, I...)) * 0.5
+
+Base.@propagate_inbounds @inline _av_xi(A::T, ϕ::T, I::Vararg{Integer,3}) where {T<:T3} =
+    (front(A, ϕ, I...), next(A, ϕ, I...)) * 0.5
+
+Base.@propagate_inbounds @inline _av_yi(A::T, ϕ::T, I::Vararg{Integer,3}) where {T<:T3} =
+    (right(A, ϕ, I...), next(A, ϕ, I...)) * 0.5
+
+Base.@propagate_inbounds @inline _av_zi(A::T, ϕ::T, I::Vararg{Integer,3}) where {T<:T3} =
+    (top(A, ϕ, I...) + next(A, ϕ, I...)) * 0.5
+
 ## Because mysum(::generator) does not work inside CUDA kernels...
 @inline mysum(A, ϕ, ranges::Vararg{T,N}) where {T,N} = mysum(identity, A, ϕ, ranges...)
 

diff --git a/src/variational_stokes/Stokes2D.jl b/src/variational_stokes/Stokes2D.jl
@@ -81,9 +81,6 @@ function _solve_VS!(
     compute_viscosity!(stokes, phase_ratios, args, rheology, air_phase, viscosity_cutoff)
     displacement2velocity!(stokes, dt, flow_bcs)
 
-    @parallel (@idx ni .+ 1) multi_copy!(@tensor(stokes.τ_o), @tensor(stokes.τ))
-    @parallel (@idx ni) multi_copy!(@tensor_center(stokes.τ_o), @tensor_center(stokes.τ))
-
     while iter ≤ iterMax
         iterMin < iter && err < ϵ && break
 
@@ -100,7 +97,7 @@ function _solve_VS!(
                 stokes.∇V,
                 ητ,
                 rheology,
-                phase_ratios.center,
+                phase_ratios,
                 dt,
                 r,
                 θ_dτ,
@@ -213,6 +210,9 @@ function _solve_VS!(
     # accumulate plastic strain tensor
     @parallel (@idx ni) accumulate_tensor!(stokes.EII_pl, @tensor_center(stokes.ε_pl), dt)
 
+    @parallel (@idx ni .+ 1) multi_copy!(@tensor(stokes.τ_o), @tensor(stokes.τ))
+    @parallel (@idx ni) multi_copy!(@tensor_center(stokes.τ_o), @tensor_center(stokes.τ))
+
     return (
         iter=iter,
         err_evo1=err_evo1,

diff --git a/src/variational_stokes/Stokes3D.jl b/src/variational_stokes/Stokes3D.jl
@@ -0,0 +1,221 @@
+## 3D VISCO-ELASTIC STOKES SOLVER
+
+# backend trait
+function solve_VariationalStokes!(stokes::JustRelax.StokesArrays, args...; kwargs)
+    solve_VariationalStokes!(backend(stokes), stokes, args...; kwargs)
+    return nothing
+end
+
+# entry point for extensions
+function solve_VariationalStokes!(::CPUBackendTrait, stokes, args...; kwargs)
+    return _solve_VS!(stokes, args...; kwargs...)
+end
+
+
+# GeoParams and multiple phases
+function _solve!(
+    stokes::JustRelax.StokesArrays,
+    pt_stokes,
+    di::NTuple{3,T},
+    flow_bcs::AbstractFlowBoundaryConditions,
+    ρg,
+    phase_ratios::JustPIC.PhaseRatios,
+    ϕ::JustRelax.RockRatio,
+    rheology::NTuple{N,AbstractMaterialParamsStruct},
+    args,
+    dt,
+    igg::IGG;
+    iterMax=10e3,
+    nout=500,
+    b_width=(4, 4, 4),
+    verbose=true,
+    viscosity_relaxation=1e-2,
+    viscosity_cutoff=(-Inf, Inf),
+    kwargs...,
+) where {T,N}
+
+    ## UNPACK
+
+    # solver related
+    ϵ = pt_stokes.ϵ
+    # geometry
+    _di = @. 1 / di
+    ni = size(stokes.P)
+    (; η, η_vep) = stokes.viscosity
+
+    # errors
+    err = Inf
+    iter = 0
+    cont = 0
+    err_evo1 = Float64[]
+    err_evo2 = Int64[]
+    norm_Rx = Float64[]
+    norm_Ry = Float64[]
+    norm_Rz = Float64[]
+    norm_∇V = Float64[]
+
+    @copy stokes.P0 stokes.P
+    θ = deepcopy(stokes.P)
+    λ = @zeros(ni...)
+    λv_yz = @zeros(size(stokes.τ.yz)...)
+    λv_xz = @zeros(size(stokes.τ.xz)...)
+    λv_xy = @zeros(size(stokes.τ.xy)...)
+
+    # solver loop
+    wtime0 = 0.0
+    ητ = deepcopy(η)
+
+    # compute buoyancy forces and viscosity
+    compute_ρg!(ρg, phase_ratios, rheology, args)
+    compute_viscosity!(stokes, phase_ratios, args, rheology, viscosity_cutoff)
+
+    # convert displacement to velocity
+    displacement2velocity!(stokes, dt, flow_bcs)
+
+    while iter < 2 || (err > ϵ && iter ≤ iterMax)
+        wtime0 += @elapsed begin
+            # ~preconditioner
+            compute_maxloc!(ητ, η)
+            update_halo!(ητ)
+
+            @parallel (@idx ni) compute_∇V!(stokes.∇V, @velocity(stokes)..., _di...)
+            compute_P!(
+                θ,
+                stokes.P0,
+                stokes.R.RP,
+                stokes.∇V,
+                ητ,
+                rheology,
+                phase_ratios.center,
+                dt,
+                pt_stokes.r,
+                pt_stokes.θ_dτ,
+                args,
+            )
+
+            @parallel (@idx ni) compute_strain_rate!(
+                stokes.∇V, @strain(stokes)..., @velocity(stokes)..., ϕ, _di...
+            )
+
+            # Update buoyancy
+            update_ρg!(ρg, phase_ratios, rheology, args)
+
+            # Update viscosity
+            update_viscosity!(
+                stokes,
+                phase_ratios,
+                args,
+                rheology,
+                viscosity_cutoff;
+                air_phase=air_phase,
+                relaxation=viscosity_relaxation,
+            )
+            # update_stress!(stokes, θ, λ, phase_ratios, rheology, dt, pt_stokes.θ_dτ)
+
+            @parallel (@idx ni .+ 1) update_stresses_center_vertex!(
+                @strain(stokes),
+                @tensor_center(stokes.ε_pl),
+                stokes.EII_pl,
+                @tensor_center(stokes.τ),
+                (stokes.τ.yz, stokes.τ.xz, stokes.τ.xy),
+                @tensor_center(stokes.τ_o),
+                (stokes.τ_o.yz, stokes.τ_o.xz, stokes.τ_o.xy),
+                θ,
+                stokes.P,
+                stokes.viscosity.η,
+                λ,
+                (λv_yz, λv_xz, λv_xy),
+                stokes.τ.II,
+                stokes.viscosity.η_vep,
+                0.2,
+                dt,
+                pt_stokes.θ_dτ,
+                rheology,
+                phase_ratios.center,
+                phase_ratios.vertex,
+                phase_ratios.xy,
+                phase_ratios.yz,
+                phase_ratios.xz,
+                ϕ,
+            )
+            update_halo!(stokes.τ.yz)
+            update_halo!(stokes.τ.xz)
+            update_halo!(stokes.τ.xy)
+
+            @hide_communication b_width begin # communication/computation overlap
+                @parallel compute_V!(
+                    @velocity(stokes)...,
+                    @residuals(stokes.R)...,
+                    stokes.P,
+                    ρg...,
+                    @stress(stokes)...,
+                    ητ,
+                    pt_stokes.ηdτ,
+                    ϕ,
+                    _di...,
+                )
+                # apply boundary conditions
+                velocity2displacement!(stokes, dt)
+                free_surface_bcs!(stokes, flow_bcs, η, rheology, phase_ratios, dt, di)
+                flow_bcs!(stokes, flow_bcs)
+                update_halo!(@velocity(stokes)...)
+            end
+        end
+
+        iter += 1
+        if iter % nout == 0 && iter > 1
+            cont += 1
+            for (norm_Ri, Ri) in zip((norm_Rx, norm_Ry, norm_Rz), @residuals(stokes.R))
+                push!(
+                    norm_Ri,
+                    norm_mpi(Ri[2:(end - 1), 2:(end - 1), 2:(end - 1)]) / length(Ri),
+                )
+            end
+            push!(norm_∇V, norm_mpi(stokes.R.RP) / length(stokes.R.RP))
+            err = max(norm_Rx[cont], norm_Ry[cont], norm_Rz[cont], norm_∇V[cont])
+            push!(err_evo1, err)
+            push!(err_evo2, iter)
+            if igg.me == 0 && (verbose || iter == iterMax)
+                @printf(
+                    "iter = %d, err = %1.3e [norm_Rx=%1.3e, norm_Ry=%1.3e, norm_Rz=%1.3e, norm_∇V=%1.3e] \n",
+                    iter,
+                    err,
+                    norm_Rx[cont],
+                    norm_Ry[cont],
+                    norm_Rz[cont],
+                    norm_∇V[cont]
+                )
+            end
+            isnan(err) && error("NaN(s)")
+        end
+
+        if igg.me == 0 && err ≤ ϵ
+            println("Pseudo-transient iterations converged in $iter iterations")
+        end
+    end
+
+    av_time = wtime0 / (iter - 1) # average time per iteration
+
+    # compute vorticity
+    @parallel (@idx ni .+ 1) compute_vorticity!(
+        stokes.ω.yz, stokes.ω.xz, stokes.ω.xy, @velocity(stokes)..., inv.(di)...
+    )
+
+    # accumulate plastic strain tensor
+    @parallel (@idx ni) accumulate_tensor!(stokes.EII_pl, @tensor_center(stokes.ε_pl), dt)
+
+    @parallel (@idx ni .+ 1) multi_copy!(@tensor(stokes.τ_o), @tensor(stokes.τ))
+    @parallel (@idx ni) multi_copy!(@tensor_center(stokes.τ_o), @tensor_center(stokes.τ))
+
+    return (
+        iter=iter,
+        err_evo1=err_evo1,
+        err_evo2=err_evo2,
+        norm_Rx=norm_Rx,
+        norm_Ry=norm_Ry,
+        norm_Rz=norm_Rz,
+        norm_∇V=norm_∇V,
+        time=wtime0,
+        av_time=av_time,
+    )
+end