sweep_coupled_implicit_terms Subroutine

public subroutine sweep_coupled_implicit_terms(this, pf, lev, t0, dt)

Uses

  • proc~~sweep_coupled_implicit_terms~~UsesGraph proc~sweep_coupled_implicit_terms sweep_coupled_implicit_terms module~pf_mod_timer pf_mod_timer proc~sweep_coupled_implicit_terms->module~pf_mod_timer module~pf_mod_dtype pf_mod_dtype module~pf_mod_timer->module~pf_mod_dtype iso_c_binding iso_c_binding module~pf_mod_dtype->iso_c_binding

Arguments

Type IntentOptional AttributesName
class(pf_amisdcQ_t), intent(inout) :: this
type(pf_pfasst_t), intent(inout) :: pf
class(pf_level_t), intent(inout) :: lev
real(kind=pfdp), intent(in) :: t0
real(kind=pfdp), intent(in) :: dt

Calls

proc~~sweep_coupled_implicit_terms~~CallsGraph proc~sweep_coupled_implicit_terms sweep_coupled_implicit_terms proc~start_timer start_timer proc~sweep_coupled_implicit_terms->proc~start_timer proc~end_timer end_timer proc~sweep_coupled_implicit_terms->proc~end_timer

Called by

proc~~sweep_coupled_implicit_terms~~CalledByGraph proc~sweep_coupled_implicit_terms sweep_coupled_implicit_terms proc~amisdcq_sweep amisdcQ_sweep proc~amisdcq_sweep->proc~sweep_coupled_implicit_terms

Contents


Source Code

  subroutine sweep_coupled_implicit_terms(this, pf, lev, t0, dt)
    use pf_mod_timer
    class(pf_amisdcQ_t), intent(inout) :: this
    type(pf_pfasst_t),   intent(inout) :: pf
    real(pfdp),          intent(in)    :: dt, t0
    class(pf_level_t),   intent(inout) :: lev

    integer                        :: m, n
    real(pfdp)                     :: t
    real(pfdp)                     :: dtsdc(1:lev%nnodes-1)
    class(pf_encap_t), allocatable :: rhsA, rhsB, QA, QB
    class(pf_encap_t), allocatable :: S2(:), S3(:)

    call start_timer(pf, TLEVEL+lev%index-1)
   
    call lev%ulevel%factory%create_array(S2,lev%nnodes-1,lev%index,lev%shape)
    call lev%ulevel%factory%create_array(S3,lev%nnodes-1,lev%index,lev%shape)
    
    ! compute integrals and add fas correction
    do m = 1, lev%nnodes-1

       call lev%S(m)%setval(0.0_pfdp)
       call S2(m)%setval(0.0d0)
       call S3(m)%setval(0.0d0)

       do n = 1, lev%nnodes
          call lev%S(m)%axpy(dt*this%QdiffE(m,n), lev%F(n,1))
          call lev%S(m)%axpy(1.0_pfdp*dt*lev%qmat(m,n),    lev%F(n,2))
          call lev%S(m)%axpy(1.0_pfdp*dt*lev%qmat(m,n),    lev%F(n,3))
          call S2(m)%axpy(2.0_pfdp*dt*this%QtilI(m,n),     lev%F(n,2))
          call S3(m)%axpy(2.0_pfdp*dt*this%QtilI(m,n),     lev%F(n,3))
       end do
       if (allocated(lev%tauQ)) then
          call lev%S(m)%axpy(1.0_pfdp, lev%tauQ(m))
       end if
    end do

    ! do the time-stepping
    call lev%Q(1)%copy(lev%q0)

    call this%f1eval(lev%Q(1), t0, lev%index, lev%F(1,1))
    call this%f2eval(lev%Q(1), t0, lev%index, lev%F(1,2))
    call this%f3eval(lev%Q(1), t0, lev%index, lev%F(1,3))

    call lev%ulevel%factory%create_single(rhsA, lev%index,   lev%shape)
    call lev%ulevel%factory%create_single(rhsB, lev%index,   lev%shape)
    call lev%ulevel%factory%create_single(QA,   lev%index,   lev%shape)
    call lev%ulevel%factory%create_single(QB,   lev%index,   lev%shape)

    call QA%setval(0.0_pfdp)
    call QB%setval(0.0_pfdp)

    t = t0
    dtsdc = dt * (lev%nodes(2:lev%nnodes) - lev%nodes(1:lev%nnodes-1))
    do m = 1, lev%nnodes-1
       t = t + dtsdc(m)
             
       call rhsA%copy(lev%Q(1))
       ! First compute the explicit part of the right-hand side
       do n = 1, m
          call rhsA%axpy(dt*this%QtilE(m,n), lev%F(n,1))  
       end do
       call rhsA%axpy(1.0_pfdp, lev%S(m))
   
       ! Save the right-hand side with only the explicit contribution
       call rhsB%copy(rhsA)

       ! Add the first implicit part to the right-hand side and solve for the first asynchronous update
       do n = 1, m
          call rhsA%axpy(2.0_pfdp*dt*this%QtilI(m,n), lev%F(n,2))  
       end do
       call rhsA%axpy(-1.0_pfdp, S2(m))  
       call this%f2comp(QA, t, 2.0_pfdp*dt*this%QtilI(m,m+1), rhsA, lev%index, lev%F(m+1,2))

       ! Add the second implicit part to the right-hand side and solve for the second asynchronous update
       do n = 1, m
          call rhsB%axpy(2.0_pfdp*dt*this%QtilI(m,n), lev%F(n,3))  
       end do
       call rhsB%axpy(-1.0_pfdp, S3(m))  
       call this%f3comp(QB, t, 2.0_pfdp*dt*this%QtilI(m,m+1), rhsB, lev%index, lev%F(m+1,3))

       ! Now we average the two asynchronous updates
       call lev%Q(m+1)%setval(0.0_pfdp)
       call lev%Q(m+1)%axpy(0.5_pfdp, QA)
       call lev%Q(m+1)%axpy(0.5_pfdp, QB)

       ! Evaluate the three right-hand sides with the updated variables
       call this%f1eval(lev%Q(m+1), t, lev%index, lev%F(m+1,1))
       call this%f2eval(lev%Q(m+1), t, lev%index, lev%F(m+1,2))
       call this%f3eval(lev%Q(m+1), t, lev%index, lev%F(m+1,3))
    end do

    call lev%qend%copy(lev%Q(lev%nnodes))

    call lev%ulevel%factory%destroy_array(S2,lev%nnodes-1,lev%index,lev%shape)
    call lev%ulevel%factory%destroy_array(S3,lev%nnodes-1,lev%index,lev%shape)
    call lev%ulevel%factory%destroy_single(rhsA, lev%index,   lev%shape)
    call lev%ulevel%factory%destroy_single(rhsB, lev%index,   lev%shape)
    call lev%ulevel%factory%destroy_single(QA,   lev%index,   lev%shape)
    call lev%ulevel%factory%destroy_single(QB,   lev%index,   lev%shape)

    call end_timer(pf, TLEVEL+lev%index-1)

  end subroutine sweep_coupled_implicit_terms