remove IB support and precompute pressure gradients

wilfonba · wilfonba · commit 96d5f2f2a983 · 2026-02-15T09:15:37.000-05:00
diff --git a/src/simulation/m_bubbles_EL.fpp b/src/simulation/m_bubbles_EL.fpp
@@ -31,6 +31,8 @@ module m_bubbles_EL
 
     use m_ibm
 
+    use m_finite_differences
+
     implicit none
 
     !(nBub)
@@ -189,6 +191,29 @@ contains
         $:GPU_UPDATE(device='[moving_lag_bubbles, lag_pressure_force, &
             & lag_gravity_force, lag_vel_model, lag_drag_model]')
 
+        ! Allocate cell-centered pressure gradient arrays and FD coefficients
+        if (lag_params%vel_model > 0 .and. lag_params%pressure_force) then
+            @:ALLOCATE(grad_p_x(0:m, 0:n, 0:p))
+            @:ALLOCATE(fd_coeff_x_pgrad(-fd_number:fd_number, 0:m))
+            call s_compute_finite_difference_coefficients(m, x_cc, fd_coeff_x_pgrad, &
+                                                          buff_size, fd_number, fd_order)
+            $:GPU_UPDATE(device='[fd_coeff_x_pgrad]')
+            if (n > 0) then
+                @:ALLOCATE(grad_p_y(0:m, 0:n, 0:p))
+                @:ALLOCATE(fd_coeff_y_pgrad(-fd_number:fd_number, 0:n))
+                call s_compute_finite_difference_coefficients(n, y_cc, fd_coeff_y_pgrad, &
+                                                              buff_size, fd_number, fd_order)
+                $:GPU_UPDATE(device='[fd_coeff_y_pgrad]')
+            end if
+            if (p > 0) then
+                @:ALLOCATE(grad_p_z(0:m, 0:n, 0:p))
+                @:ALLOCATE(fd_coeff_z_pgrad(-fd_number:fd_number, 0:p))
+                call s_compute_finite_difference_coefficients(p, z_cc, fd_coeff_z_pgrad, &
+                                                              buff_size, fd_number, fd_order)
+                $:GPU_UPDATE(device='[fd_coeff_z_pgrad]')
+            end if
+        end if
+
         call s_read_input_bubbles(q_cons_vf, bc_type)
 
     end subroutine s_initialize_bubbles_EL_module
@@ -612,10 +637,9 @@ contains
 
         integer :: k, l
 
-        call nvtxStartRange("LAGRANGE-BUBBLE-DYNAMICS")
-
         ! Subgrid p_inf model based on Maeda and Colonius (2018).
         if (lag_params%pressure_corrector) then
+            call nvtxStartRange("LAGRANGE-BUBBLE-PINF-CORRECTION")
             ! Calculate velocity potentials (valid for one bubble per cell)
             $:GPU_PARALLEL_LOOP(private='[k,cell,paux,preterm1,term2,Romega,myR0,myR,myV,myPb,pint,term1_fac]')
             do k = 1, n_el_bubs_loc
@@ -635,8 +659,17 @@ contains
                 end if
             end do
             $:END_GPU_PARALLEL_LOOP()
+            call nvtxEndRange()
+        end if
+
+        ! Precompute cell-centered pressure gradients for translational motion
+        if (moving_lag_bubbles .and. lag_pressure_force) then
+            call nvtxStartRange("LAGRANGE-BUBBLE-PRESSURE-GRADIENT")
+            call s_compute_pressure_gradients(q_prim_vf)
+            call nvtxEndRange()
         end if
 
+        call nvtxStartRange("LAGRANGE-BUBBLE-DYNAMICS")
         ! Radial motion model
         adap_dt_stop_sum = 0
         $:GPU_PARALLEL_LOOP(private='[k,myalpha_rho,myalpha,Re,cell,myVapFlux,preterm1, term2, paux, pint, Romega,term1_fac,myR_m, mygamma_m, myPb, myMass_n, myMass_v,myR, myV, myBeta_c, myBeta_t, myR0, myPbdot, myMvdot,myPinf, aux1,aux2, myCson, myRho,gamma,pi_inf,qv,dmalf, dmntait, dmBtait, dm_bub_adv_src, dm_divu,adap_dt_stop,myPos,myVel]', &
@@ -737,6 +770,7 @@ contains
 
         end do
         $:END_GPU_PARALLEL_LOOP()
+        call nvtxEndRange
 
         if (adap_dt .and. adap_dt_stop_sum > 0) call s_mpi_abort("Adaptive time stepping failed to converge.")
 
@@ -746,8 +780,6 @@ contains
             call s_smear_voidfraction(bc_type)
         end if
 
-        call nvtxEndRange
-
     end subroutine s_compute_bubble_EL_dynamics
 
     !>  The purpose of this subroutine is to obtain the bubble source terms based on Maeda and Colonius (2018)
@@ -763,6 +795,7 @@ contains
 
         integer :: i, j, k, l
 
+        call nvtxStartRange("LAGRANGE-BUBBLE-EL-SOURCE")
         ! (q / (1 - beta)) * d(beta)/dt source
         if (p == 0) then
             $:GPU_PARALLEL_LOOP(private='[i,j,k,l]', collapse=4)
@@ -846,6 +879,7 @@ contains
             end do
             $:END_GPU_PARALLEL_LOOP()
         end do
+        call nvtxEndRange ! LAGRANGE-BUBBLE-EL-SOURCE
 
     end subroutine s_compute_bubbles_EL_source
 
@@ -892,7 +926,7 @@ contains
         type(integer_field), dimension(1:num_dims, 1:2), intent(in) :: bc_type
         integer :: i, j, k, l
 
-        call nvtxStartRange("BUBBLES-LAGRANGE-KERNELS")
+        call nvtxStartRange("BUBBLES-LAGRANGE-SMEARING")
         $:GPU_PARALLEL_LOOP(private='[i,j,k,l]', collapse=4)
         do i = 1, q_beta_idx
             do l = idwbuff(3)%beg, idwbuff(3)%end
@@ -929,7 +963,7 @@ contains
             end do
         end do
         $:END_GPU_PARALLEL_LOOP()
-        call nvtxEndRange ! BUBBLES-LAGRANGE-KERNELS
+        call nvtxEndRange ! BUBBLES-LAGRANGE-SMEARING
 
     end subroutine s_smear_voidfraction
 
@@ -1483,26 +1517,6 @@ contains
                 if (q_prim_vf(advxb)%sf(cell(1), cell(2), cell(3)) < (1._wp - lag_params%valmaxvoid)) then
                     keep_bubble(k) = 0
                 end if
-
-                ! Move bubbles back to surface of IB
-                if (ib) then
-                    cell = fd_number - buff_size
-                    call s_locate_cell(mtn_pos(k, 1:3, 2), cell, mtn_s(k, 1:3, 2))
-
-                    if (ib_markers%sf(cell(1), cell(2), cell(3)) /= 0) then
-                        patch_id = ib_markers%sf(cell(1), cell(2), cell(3))
-
-                        $:GPU_LOOP(parallelism='[seq]')
-                        do i = 1, num_dims
-                            mtn_pos(k, i, 2) = mtn_pos(k, i, 2) - &
-                                               levelset_norm%sf(cell(1), cell(2), cell(3), patch_id, i) &
-                                               *levelset%sf(cell(1), cell(2), cell(3), patch_id)
-                        end do
-
-                        cell = fd_number - buff_size
-                        call s_locate_cell(mtn_pos(k, 1:3, 2), cell, mtn_s(k, 1:3, 2))
-                    end if
-                end if
             end if
         end do
         $:END_GPU_PARALLEL_LOOP()
@@ -2229,6 +2243,20 @@ contains
         @:DEALLOCATE(mtn_dposdt)
         @:DEALLOCATE(mtn_dveldt)
 
+        ! Deallocate pressure gradient arrays and FD coefficients
+        if (lag_params%vel_model > 0 .and. lag_params%pressure_force) then
+            @:DEALLOCATE(grad_p_x)
+            @:DEALLOCATE(fd_coeff_x_pgrad)
+            if (n > 0) then
+                @:DEALLOCATE(grad_p_y)
+                @:DEALLOCATE(fd_coeff_y_pgrad)
+                if (p > 0) then
+                    @:DEALLOCATE(grad_p_z)
+                    @:DEALLOCATE(fd_coeff_z_pgrad)
+                end if
+            end if
+        end if
+
     end subroutine s_finalize_lagrangian_solver
 
 end module m_bubbles_EL
diff --git a/src/simulation/m_bubbles_EL_kernels.fpp b/src/simulation/m_bubbles_EL_kernels.fpp
@@ -12,6 +12,16 @@ module m_bubbles_EL_kernels
 
     implicit none
 
+    ! Cell-centered pressure gradients (precomputed for translational motion)
+    real(wp), allocatable, dimension(:, :, :) :: grad_p_x, grad_p_y, grad_p_z
+    $:GPU_DECLARE(create='[grad_p_x, grad_p_y, grad_p_z]')
+
+    ! Finite-difference coefficients for pressure gradient computation
+    real(wp), allocatable, dimension(:, :) :: fd_coeff_x_pgrad
+    real(wp), allocatable, dimension(:, :) :: fd_coeff_y_pgrad
+    real(wp), allocatable, dimension(:, :) :: fd_coeff_z_pgrad
+    $:GPU_DECLARE(create='[fd_coeff_x_pgrad, fd_coeff_y_pgrad, fd_coeff_z_pgrad]')
+
 contains
 
     !> The purpose of this subroutine is to smear the strength of the lagrangian
@@ -372,6 +382,71 @@ contains
 
     end subroutine s_get_cell
 
+    !> Precomputes the cell-centered pressure gradients (dp/dx, dp/dy, dp/dz) over the cells
+        !!      (0:m, 0:n, 0:p) from the stored finite-difference coefficients, so the bubble
+        !!      force evaluation reads one stored value per direction. grad_p_y and
+        !!      grad_p_z are only written when n > 0 and p > 0, respectively.
+        !! @param q_prim_vf Primitive variables (pressure is at index E_idx)
+    subroutine s_compute_pressure_gradients(q_prim_vf)
+
+        type(scalar_field), dimension(sys_size), intent(in) :: q_prim_vf
+        integer :: i, j, k, r
+        real(wp) :: dp_acc !< Thread-local stencil sum, so each gradient cell is stored once
+
+        ! dp/dx: the stencil reaches fd_number cells outside 0:m, pressure must be valid there
+        $:GPU_PARALLEL_LOOP(private='[i,j,k,r,dp_acc]', collapse=3)
+        do k = 0, p
+            do j = 0, n
+                do i = 0, m
+                    dp_acc = 0._wp
+                    $:GPU_LOOP(parallelism='[seq]')
+                    do r = -fd_number, fd_number
+                        dp_acc = dp_acc + q_prim_vf(E_idx)%sf(i + r, j, k)*fd_coeff_x_pgrad(r, i)
+                    end do
+                    grad_p_x(i, j, k) = dp_acc
+                end do
+            end do
+        end do
+        $:END_GPU_PARALLEL_LOOP()
+
+        ! dp/dy: same stencil applied along the second index (skipped for 1D runs)
+        if (n > 0) then
+            $:GPU_PARALLEL_LOOP(private='[i,j,k,r,dp_acc]', collapse=3)
+            do k = 0, p
+                do j = 0, n
+                    do i = 0, m
+                        dp_acc = 0._wp
+                        $:GPU_LOOP(parallelism='[seq]')
+                        do r = -fd_number, fd_number
+                            dp_acc = dp_acc + q_prim_vf(E_idx)%sf(i, j + r, k)*fd_coeff_y_pgrad(r, j)
+                        end do
+                        grad_p_y(i, j, k) = dp_acc
+                    end do
+                end do
+            end do
+            $:END_GPU_PARALLEL_LOOP()
+        end if
+
+        ! dp/dz: same stencil applied along the third index (skipped unless 3D)
+        if (p > 0) then
+            $:GPU_PARALLEL_LOOP(private='[i,j,k,r,dp_acc]', collapse=3)
+            do k = 0, p
+                do j = 0, n
+                    do i = 0, m
+                        dp_acc = 0._wp
+                        $:GPU_LOOP(parallelism='[seq]')
+                        do r = -fd_number, fd_number
+                            dp_acc = dp_acc + q_prim_vf(E_idx)%sf(i, j, k + r)*fd_coeff_z_pgrad(r, k)
+                        end do
+                        grad_p_z(i, j, k) = dp_acc
+                    end do
+                end do
+            end do
+            $:END_GPU_PARALLEL_LOOP()
+        end if
+
+    end subroutine s_compute_pressure_gradients
+
     !! This function interpolates the velocity of Eulerian field at the position
             !! of the bubble.
             !! @param pos Position of the bubble in directiion i
@@ -491,74 +566,8 @@ contains
         integer, intent(in) :: i
         type(scalar_field), dimension(sys_size), intent(in) :: q_prim_vf
 
-        real(wp) :: a, dp, vol, force
+        real(wp) :: dp, vol, force
         real(wp) :: v_rel
-        real(wp), dimension(fd_order) :: xi, eta, L
-
-        if (fd_order <= 2) then
-            if (i == 1) then
-                dp = (q_prim_vf(E_idx)%sf(cell(1) + 1, cell(2), cell(3)) - &
-                      q_prim_vf(E_idx)%sf(cell(1) - 1, cell(2), cell(3)))/ &
-                     (x_cc(cell(1) + 1) - x_cc(cell(1) - 1))
-            elseif (i == 2) then
-                dp = (q_prim_vf(E_idx)%sf(cell(1), cell(2) + 1, cell(3)) - &
-                      q_prim_vf(E_idx)%sf(cell(1), cell(2) - 1, cell(3)))/ &
-                     (y_cc(cell(2) + 1) - y_cc(cell(2) - 1))
-            elseif (i == 3) then
-                dp = (q_prim_vf(E_idx)%sf(cell(1), cell(2), cell(3) + 1) - &
-                      q_prim_vf(E_idx)%sf(cell(1), cell(2), cell(3) - 1))/ &
-                     (z_cc(cell(3) + 1) - z_cc(cell(3) - 1))
-            end if
-        elseif (fd_order == 4) then
-            if (i == 1) then
-                xi(1) = x_cc(cell(1) - 1)
-                eta(1) = (q_prim_vf(E_idx)%sf(cell(1), cell(2), cell(3)) - &
-                          q_prim_vf(E_idx)%sf(cell(1) - 2, cell(2), cell(3)))/ &
-                         (x_cc(cell(1)) - x_cc(cell(1) - 2))
-                xi(2) = x_cc(cell(1))
-                eta(2) = (q_prim_vf(E_idx)%sf(cell(1) + 1, cell(2), cell(3)) - &
-                          q_prim_vf(E_idx)%sf(cell(1) - 1, cell(2), cell(3)))/ &
-                         (x_cc(cell(1) + 1) - x_cc(cell(1) - 1))
-                xi(3) = x_cc(cell(1) + 1)
-                eta(3) = (q_prim_vf(E_idx)%sf(cell(1) + 2, cell(2), cell(3)) - &
-                          q_prim_vf(E_idx)%sf(cell(1), cell(2), cell(3)))/ &
-                         (x_cc(cell(1) + 2) - x_cc(cell(1)))
-            elseif (i == 2) then
-                xi(1) = y_cc(cell(2) - 1)
-                eta(1) = (q_prim_vf(E_idx)%sf(cell(1), cell(2), cell(3)) - &
-                          q_prim_vf(E_idx)%sf(cell(1), cell(2) - 2, cell(3)))/ &
-                         (y_cc(cell(2)) - y_cc(cell(2) - 2))
-                xi(2) = y_cc(cell(2))
-                eta(2) = (q_prim_vf(E_idx)%sf(cell(1), cell(2) + 1, cell(3)) - &
-                          q_prim_vf(E_idx)%sf(cell(1), cell(2) - 1, cell(3)))/ &
-                         (y_cc(cell(2) + 1) - y_cc(cell(2) - 1))
-                xi(3) = y_cc(cell(2) + 1)
-                eta(3) = (q_prim_vf(E_idx)%sf(cell(1), cell(2) + 2, cell(3)) - &
-                          q_prim_vf(E_idx)%sf(cell(1), cell(2), cell(3)))/ &
-                         (y_cc(cell(2) + 2) - y_cc(cell(2)))
-            elseif (i == 3) then
-                xi(1) = z_cc(cell(3) - 1)
-                eta(1) = (q_prim_vf(E_idx)%sf(cell(1), cell(2), cell(3)) - &
-                          q_prim_vf(E_idx)%sf(cell(1), cell(2), cell(3) - 2))/ &
-                         (z_cc(cell(3)) - z_cc(cell(3) - 2))
-                xi(2) = z_cc(cell(3))
-                eta(2) = (q_prim_vf(E_idx)%sf(cell(1), cell(2), cell(3) + 1) - &
-                          q_prim_vf(E_idx)%sf(cell(1), cell(2), cell(3) - 1))/ &
-                         (z_cc(cell(3) + 1) - z_cc(cell(3) - 1))
-                xi(3) = z_cc(cell(3) + 1)
-                eta(3) = (q_prim_vf(E_idx)%sf(cell(1), cell(2), cell(3) + 2) - &
-                          q_prim_vf(E_idx)%sf(cell(1), cell(2), cell(3)))/ &
-                         (z_cc(cell(3) + 2) - z_cc(cell(3)))
-            end if
-
-            L(1) = ((pos - xi(2))*(pos - xi(3)))/((xi(1) - xi(2))*(xi(1) - xi(3)))
-            L(2) = ((pos - xi(1))*(pos - xi(3)))/((xi(2) - xi(1))*(xi(2) - xi(3)))
-            L(3) = ((pos - xi(1))*(pos - xi(2)))/((xi(3) - xi(1))*(xi(3) - xi(2)))
-
-            dp = L(1)*eta(1) + L(2)*eta(2) + L(3)*eta(3)
-        end if
-
-        vol = (4._wp/3._wp)*pi*(rad**3._wp)
 
         if (fd_order > 1) then
             v_rel = vel - f_interpolate_velocity(pos, cell, i, q_prim_vf)
@@ -576,7 +585,17 @@ contains
             force = force - (12._wp*pi*rad*v_rel)/Re
         end if
 
-        if (lag_params%pressure_force) then
+        if (lag_pressure_force) then
+            ! Use precomputed cell-centered pressure gradients
+            if (i == 1) then
+                dp = grad_p_x(cell(1), cell(2), cell(3))
+            elseif (i == 2) then
+                dp = grad_p_y(cell(1), cell(2), cell(3))
+            elseif (i == 3) then
+                dp = grad_p_z(cell(1), cell(2), cell(3))
+            end if
+
+            vol = (4._wp/3._wp)*pi*(rad**3._wp)
             force = force - vol*dp
         end if