releases/vn0.8/fftsolver_8F90_source.html

 module fftsolver_mod
   use datadefn_mod, only : default_precision
   use grids_mod, only : x_index, y_index, z_index
   use state_mod, only : model_state_type
   use monc_component_mod, only : component_descriptor_type
   use pencil_fft_mod, only : initialise_pencil_fft, finalise_pencil_fft, perform_forward_3dfft, perform_backwards_3dfft
   use communication_types_mod, only : halo_communication_type, neighbour_description_type, field_data_wrapper_type
   use halo_communication_mod, only : copy_buffer_to_field, copy_field_to_buffer, perform_local_data_copy_for_field, &
        init_halo_communication, finalise_halo_communication, blocking_halo_swap, get_single_field_per_halo_cell
   use registry_mod, only : is_component_enabled
   use logging_mod, only : log_error, log_master_log
   use mpi, only : mpi_request_null, mpi_statuses_ignore
   implicit none

 #ifndef TEST_MODE
   private
 #endif

   !> Per wavenumber horizontal coefficients used by the tridiagonal solver. These are filled in by the
   !! initialisation callback (cos_x only when U_ACTIVE is defined, cos_y only when V_ACTIVE is defined)
   real(kind=DEFAULT_PRECISION), dimension(:), allocatable :: cos_x, cos_y
   !> Value of pi, computed in the initialisation callback as 4*atan(1)
   real(kind=DEFAULT_PRECISION) :: pi
   !> Fourier space pressure term: target of the forward FFT and source of the backwards FFT.
   !! Allocated with dimensions (z, y, x) taken from fourier_space_sizes
   real(kind=DEFAULT_PRECISION), dimension(:,:,:), allocatable :: pt
   !> Sizes returned by initialise_pencil_fft, indexed by z_index, y_index and x_index
   integer :: fourier_space_sizes(3)
   !> Halo swap state used for the blocking halo swap of p at the end of each timestep
   type(halo_communication_type), save :: halo_swap_state

   public fftsolver_get_descriptor
 contains

   !> Provides the descriptor of this component for registration.
   !! @returns A descriptor carrying the component name, version and the three lifecycle callbacks
   function fftsolver_get_descriptor() result(descriptor)
     type(component_descriptor_type) :: descriptor

     descriptor%name="fftsolver"
     descriptor%version=0.1

     ! Lifecycle hooks, all of which are private procedures of this module
     descriptor%initialisation=>initialisation_callback
     descriptor%timestep=>timestep_callback
     descriptor%finalisation=>finalisation_callback
   end function fftsolver_get_descriptor

   !> Initialisation callback. Checks that the diverr component is enabled, sets up the pencil FFT and the
   !! halo swap state for p, allocates the Fourier space pressure term and precomputes the horizontal
   !! coefficients (cos_x, cos_y) that the tridiagonal solver adds together for each wavenumber pair.
   !! @param current_state The current model state
   subroutine initialisation_callback(current_state)
     type(model_state_type), target, intent(inout) :: current_state

     integer :: idx, my_x_start, my_y_start

     if (.not. is_component_enabled(current_state%options_database, "diverr")) then
       call log_master_log(log_error, "The FFT solver component requires the diverr component to be enabled")
     end if

     pi=4.0_default_precision*atan(1.0_default_precision)

     ! The pencil FFT reports the Fourier space sizes and where this process starts in Y and X
     fourier_space_sizes=initialise_pencil_fft(current_state, my_y_start, my_x_start)

     call init_halo_communication(current_state, get_single_field_per_halo_cell, halo_swap_state, &
          halo_depth=1, involve_corners=.false.)

     allocate(pt(fourier_space_sizes(z_index), fourier_space_sizes(y_index), fourier_space_sizes(x_index)))

 #ifdef U_ACTIVE
     allocate(cos_x(fourier_space_sizes(x_index)))
     associate(dx => current_state%global_grid%configuration%horizontal%dx, &
          global_nx => current_state%global_grid%size(X_INDEX))
       do idx=1, fourier_space_sizes(x_index)
         ! The division by 2 is an integer division, so consecutive pairs of entries share one value
         ! (presumably the two parts of one complex coefficient - TODO confirm against pencil_fft_mod)
         cos_x(idx)=(2.0_default_precision/(dx*dx))&
              *(cos(2.0_default_precision*pi*real(((idx-1)+(my_x_start-1))/2, kind=default_precision)/&
              real(global_nx, kind=default_precision))-1.0_default_precision)
       end do
     end associate
 #endif

 #ifdef V_ACTIVE
     allocate(cos_y(fourier_space_sizes(y_index)))
     associate(dy => current_state%global_grid%configuration%horizontal%dy, &
          global_ny => current_state%global_grid%size(Y_INDEX))
       do idx=1, fourier_space_sizes(y_index)
         ! Same construction as for X, using the Y spacing, Y start and global Y size
         cos_y(idx)=(2.0_default_precision/(dy*dy))&
              *(cos(2.0_default_precision*pi*real(((idx-1)+(my_y_start-1))/2, kind=default_precision)/&
              real(global_ny, kind=default_precision))-1.0_default_precision)
       end do
     end associate
 #endif

     ! No psrce communications are outstanding yet, so waiting on these handles returns immediately
     current_state%psrce_x_hs_send_request=mpi_request_null
     current_state%psrce_x_hs_recv_request=mpi_request_null
     current_state%psrce_y_hs_send_request=mpi_request_null
     current_state%psrce_y_hs_recv_request=mpi_request_null
   end subroutine initialisation_callback

   !> Timestep callback. Completes the pressure source term, transforms the local domain section of p into
   !! Fourier space, performs the tridiagonal solve there, transforms back and finally halo swaps p.
   !! @param current_state The current model state
   subroutine timestep_callback(current_state)
     type(model_state_type), target, intent(inout) :: current_state

     integer :: lo(3), hi(3)

     ! First and last local domain index in each of the three dimensions
     lo=current_state%local_grid%local_domain_start_index(1:3)
     hi=current_state%local_grid%local_domain_end_index(1:3)

     call complete_psrce_calculation(current_state, current_state%local_grid%halo_size(y_index), &
          current_state%local_grid%halo_size(x_index))

 #ifdef FFT_TEST_MODE
     current_state%p%data=real(current_state%parallel%my_rank, kind=8) + 1.d0
 #endif

     ! Only the local domain section of p is handed to the FFT, the result lands in pt
     call perform_forward_3dfft(current_state, &
          current_state%p%data(lo(z_index):hi(z_index), lo(y_index):hi(y_index), lo(x_index):hi(x_index)), pt)

 #ifndef FFT_TEST_MODE
     call tridiagonal_solver(current_state, pt, fourier_space_sizes)
 #endif

     ! Design note: at this point pt is in complex space, distributed as the pencil FFT requires. The
     ! alternative would be a real space representation with one extra element on the last process in Y
     ! to hold the additional complex number. It is not clear which approach is best, but the values can
     ! be extracted from the complex form here anyway, so that is tried first and the work operates on the
     ! size of pt rather than on the grid sizes. The downside of the real space transform would be the
     ! extra element in the forwards transformation.
     call perform_backwards_3dfft(current_state, pt, &
          current_state%p%data(lo(z_index):hi(z_index), lo(y_index):hi(y_index), lo(x_index):hi(x_index)))

 #ifdef FFT_TEST_MODE
     if (current_state%parallel%my_rank == 1) then
       write(*,*) current_state%parallel%my_rank, current_state%p%data(:,3,3)
     end if
 #endif

     ! Bring the halos of p up to date now that the local domain has been rewritten
     call blocking_halo_swap(current_state, halo_swap_state, copy_p_to_halo_buffer, &
          perform_local_data_copy_for_p, copy_halo_buffer_to_p)

   end subroutine timestep_callback

   !> Finalisation callback. Asks the pencil FFT module to clean itself up, releases the halo swap state
   !! that the initialisation callback created and frees the module level work arrays.
   !! @param current_state The current model state
   subroutine finalisation_callback(current_state)
     type(model_state_type), target, intent(inout) :: current_state

     call finalise_pencil_fft(current_state%parallel%monc_communicator)

     ! Counterpart of the init_halo_communication call made in the initialisation callback, without
     ! this the buffers held by halo_swap_state are never released
     call finalise_halo_communication(halo_swap_state)

     ! Every array is guarded so that finalisation is safe even if an allocation never happened
     if (allocated(pt)) deallocate(pt)
     if (allocated(cos_x)) deallocate(cos_x)
     if (allocated(cos_y)) deallocate(cos_y)
   end subroutine finalisation_callback

   !> Completes the psrce calculation. Waits for the outstanding psrce receives, subtracts the received
   !! boundary contributions from p on the first local column in X and the first local row in Y, and then
   !! waits for the outstanding psrce sends.
   !! @param current_state The current model state
   !! @param y_halo_size The halo size in the Y dimension
   !! @param x_halo_size The halo size in the X dimension
   subroutine complete_psrce_calculation(current_state, y_halo_size, x_halo_size)
     type(model_state_type), target, intent(inout) :: current_state
     integer, intent(in) :: y_halo_size, x_halo_size

     integer :: ierr, combined_handles(2), i, j, k

     ! The receive buffers are read below, so both receives must have completed first
     combined_handles(1)=current_state%psrce_x_hs_recv_request
     combined_handles(2)=current_state%psrce_y_hs_recv_request
     call mpi_waitall(2, combined_handles, mpi_statuses_ignore, ierr)

     do j=current_state%local_grid%local_domain_start_index(y_index), current_state%local_grid%local_domain_end_index(y_index)
       do k=2,current_state%local_grid%size(z_index)
 #ifdef U_ACTIVE
         ! j is a Y index, so it is the Y halo size that maps it onto the buffer (previously the X halo
         ! size was used here, which only gives the right element when both halo sizes are equal)
         current_state%p%data(k,j,x_halo_size+1)=current_state%p%data(k,j,x_halo_size+1)-&
                current_state%psrce_recv_buffer_x(k-1,j-y_halo_size)
 #endif
 #ifdef V_ACTIVE
         ! Skipped on the first local row in Y, that row is corrected from the Y receive buffer below
         if (j .gt. y_halo_size+1) current_state%p%data(k, j, x_halo_size+1)=current_state%p%data(k, j, x_halo_size+1)-&
              current_state%global_grid%configuration%horizontal%cy * current_state%sv%data(k, j-1, x_halo_size+1)
 #endif
       end do
     end do

 #ifdef V_ACTIVE
     do i=current_state%local_grid%local_domain_start_index(x_index), current_state%local_grid%local_domain_end_index(x_index)
       do k=2,current_state%local_grid%size(z_index)
         ! i is an X index, so it is the X halo size that maps it onto the buffer (previously the Y halo
         ! size was used here, which only gives the right element when both halo sizes are equal)
         current_state%p%data(k,y_halo_size+1,i)=current_state%p%data(k,y_halo_size+1,i)-&
              current_state%psrce_recv_buffer_y(k-1,i-x_halo_size)
       end do
     end do
 #endif

     ! Finally make sure the matching sends have completed as well
     combined_handles(1)=current_state%psrce_x_hs_send_request
     combined_handles(2)=current_state%psrce_y_hs_send_request
     call mpi_waitall(2, combined_handles, mpi_statuses_ignore, ierr)
   end subroutine complete_psrce_calculation

   !> The tridiagonal solver which runs in Fourier space on the pressure terms. For every (i, j) column it
   !! performs a forward elimination sweep up the column from level 2 followed by a back substitution down
   !! to level 2, overwriting pressure_term in place. The columns with i and j both in 1..2 on the process
   !! whose X and Y both start at 1 (the zero wavenumber) are skipped by the main loop and handled by a
   !! separate upward recurrence at the end.
   !! NOTE(review): cos_x and cos_y are both read here unconditionally, but they are only allocated when
   !! U_ACTIVE and V_ACTIVE respectively are defined - confirm both are always defined when this is used.
   !! @param current_state The current model state
   !! @param pressure_term The Fourier space pressure term, indexed (z, y, x), which is updated in place
   !! @param fourier_space_sizes The sizes of the Fourier space data in each dimension
   subroutine tridiagonal_solver(current_state, pressure_term, fourier_space_sizes)
     type(model_state_type), target, intent(inout) :: current_state
     real(kind=DEFAULT_PRECISION), dimension(:,:,:), intent(inout) :: pressure_term
     integer, intent(in) :: fourier_space_sizes(3)

     integer :: i, j, k, j_start
     ! b is the diagonal term, b1 the reciprocal of the eliminated diagonal, s1 the eliminated right hand
     ! side and s keeps the original values in the zero wavenumber recurrence
     real(kind=DEFAULT_PRECISION) :: b(fourier_space_sizes(z_index)), b1(fourier_space_sizes(z_index)),   &
         s(fourier_space_sizes(z_index)), s1(fourier_space_sizes(z_index)), cij

     do i=1,fourier_space_sizes(x_index)
       ! On the process whose X and Y both start at 1, skip j=1,2 for i=1,2 as these columns are the zero
       ! wavenumber which is treated separately below
       j_start=merge(3, 1, current_state%local_grid%start(y_index) ==1 .and. current_state%local_grid%start(x_index) == 1 &
            .and. i .lt. 3)
       do j=j_start,fourier_space_sizes(y_index)

         ! Horizontal contribution to the diagonal for this wavenumber pair
         cij=cos_x(i)+cos_y(j)
         ! Level 2 is the first level solved for, level 1 is left untouched by this loop
         b(2)=cij-current_state%global_grid%configuration%vertical%cza(2)
         b1(2)=1.0_default_precision/b(2)
         s1(2)=pressure_term(2,j,i)

         ! Forward elimination sweep up the column
         do k=3,fourier_space_sizes(z_index)
            b(k)=cij+current_state%global_grid%configuration%vertical%czg(k)
            b1(k)=1.0_default_precision/(b(k)-current_state%global_grid%configuration%vertical%czh(k)*b1(k-1))
            s1(k)=pressure_term(k,j,i)-current_state%global_grid%configuration%vertical%czb(k)*s1(k-1)*b1(k-1)
         end do

         ! The top level follows directly from the eliminated system
         pressure_term(fourier_space_sizes(z_index),j,i)=s1(fourier_space_sizes(z_index))* b1(fourier_space_sizes(z_index))

         ! Back substitution down the column, each level uses the already solved level above it
         do k=fourier_space_sizes(z_index)-1,2,-1
           pressure_term(k,j,i)=(s1(k)-current_state%global_grid%configuration%vertical%cza(k)*&
                pressure_term(k+1,j,i))*b1(k)
         end do
       end do
     end do

     ! Handle the zero wavenumber, which will only be on processes where the X and Y  dimension starts at 1
     if (current_state%local_grid%start(y_index) == 1 .and. current_state%local_grid%start(x_index) == 1) then
       do i=1,2
         do j=1,2
           ! Save the original level 2 value before levels 1 and 2 are fixed at zero
           s(2)=pressure_term(2,j,i)
           pressure_term(1,j,i)=0.0_default_precision
           pressure_term(2,j,i)=0.0_default_precision
           do k=3, fourier_space_sizes(z_index)
             ! The original value at k must be saved before it is overwritten, as the next iteration
             ! needs it as s(k-1). Each level is built from the two solved levels below it
             s(k)=pressure_term(k,j,i)
             pressure_term(k,j,i)=(s(k-1)-current_state%global_grid%configuration%vertical%czg(k-1)*pressure_term(k-1,j,i)-&
                  current_state%global_grid%configuration%vertical%czb(k-1)*pressure_term(k-2,j,i))/&
                  current_state%global_grid%configuration%vertical%cza(k-1)
           end do
         end do
       end do
     end if
   end subroutine tridiagonal_solver

   !> Copies the p field data into the send halo buffer of a neighbour for one dimension and halo cell,
   !! then advances the page counter of that neighbour by one.
   !! @param current_state The current model state
   !! @param neighbour_description Description of the neighbour, which holds the send buffer written to
   !! @param dim The dimension being sent in
   !! @param source_index The source index in that dimension
   !! @param pid_location The entry of current_page that belongs to this neighbour
   !! @param current_page The page counters, the entry for this neighbour is incremented
   !! @param source_data Optional source data, not used by this procedure
   subroutine copy_p_to_halo_buffer(current_state, neighbour_description, dim, source_index, &
        pid_location, current_page, source_data)
     type(model_state_type), intent(inout) :: current_state
     type(neighbour_description_type), intent(inout) :: neighbour_description
     integer, intent(in) :: dim, source_index, pid_location
     integer, intent(inout) :: current_page(:)
     type(field_data_wrapper_type), dimension(:), intent(in), optional :: source_data

     associate(page => current_page(pid_location))
       call copy_field_to_buffer(current_state%local_grid, neighbour_description%send_halo_buffer, &
            current_state%p%data, dim, source_index, page)
       ! Move on to the next page for this neighbour
       page=page+1
     end associate
   end subroutine copy_p_to_halo_buffer

   !> Copies the received halo buffer of a neighbour into the p field for one dimension and halo cell,
   !! then advances the page counter of that neighbour by one.
   !! @param current_state The current model state
   !! @param neighbour_description Description of the neighbour, which holds the receive buffer read from
   !! @param dim The dimension we receive for
   !! @param target_index The target index for the dimension we are receiving for
   !! @param neighbour_location The location in the local neighbour data stores of this neighbour
   !! @param current_page The current, next, halo swap page to read from (all previous have been read and copied already)
   !! @param source_data Optional source data, not used by this procedure
   subroutine copy_halo_buffer_to_p(current_state, neighbour_description, dim, target_index, &
        neighbour_location, current_page, source_data)
     type(model_state_type), intent(inout) :: current_state
     type(neighbour_description_type), intent(inout) :: neighbour_description
     integer, intent(in) :: dim, target_index, neighbour_location
     integer, intent(inout) :: current_page(:)
     type(field_data_wrapper_type), dimension(:), intent(in), optional :: source_data

     associate(page => current_page(neighbour_location))
       call copy_buffer_to_field(current_state%local_grid, neighbour_description%recv_halo_buffer, &
            current_state%p%data, dim, target_index, page)
       ! This page has now been consumed, so step on to the next one
       page=page+1
     end associate
   end subroutine copy_halo_buffer_to_p

   !> Does local data copying for the P variable halo swap by delegating to the generic field routine.
   !! @param current_state The current model state
   !! @param halo_depth The halo depth, passed straight through
   !! @param involve_corners Whether corners are involved, passed straight through
   !! @param source_data Optional source data, not used by this procedure
   subroutine perform_local_data_copy_for_p(current_state, halo_depth, involve_corners, source_data)
     type(model_state_type), intent(inout) :: current_state
     integer, intent(in) :: halo_depth
     logical, intent(in) :: involve_corners
     type(field_data_wrapper_type), dimension(:), intent(in), optional :: source_data

     call perform_local_data_copy_for_field(field_data=current_state%p%data, &
          local_grid=current_state%local_grid, my_rank=current_state%parallel%my_rank, &
          halo_depth=halo_depth, involve_corners=involve_corners)
   end subroutine perform_local_data_copy_for_p
 end module fftsolver_mod
fftsolver_mod::tridiagonal_solver
subroutine tridiagonal_solver(current_state, pressure_term, fourier_space_sizes)
The tridiagonal solver which runs in Fourier space on the pressure terms. Note that because we are go...
Definition: fftsolver.F90:189

halo_communication_mod::init_halo_communication
subroutine, public init_halo_communication(current_state, get_fields_per_halo_cell, halo_state, halo_depth, involve_corners)
Initialises a halo swapping state, by determining the neighbours, size of data in each swap and alloc...
Definition: halocommunication.F90:295

halo_communication_mod::blocking_halo_swap
subroutine, public blocking_halo_swap(current_state, halo_swap_state, copy_to_halo_buffer, perform_local_data_copy, copy_from_halo_buffer, copy_corners_to_halo_buffer, copy_from_halo_buffer_to_corner, source_data)
Performs the entire halo swap operation, this is simply a wrapper around the nonblocking initiate and...
Definition: halocommunication.F90:112

fftsolver_mod::perform_local_data_copy_for_p
subroutine perform_local_data_copy_for_p(current_state, halo_depth, involve_corners, source_data)
Does local data copying for P variable halo swap.
Definition: fftsolver.F90:285

halo_communication_mod::perform_local_data_copy_for_field
subroutine, public perform_local_data_copy_for_field(field_data, local_grid, my_rank, halo_depth, involve_corners)
Will perform a local copy for the halo data of a field.
Definition: halocommunication.F90:483

logging_mod::log_error
integer, parameter, public log_error
Only log ERROR messages.
Definition: logging.F90:11

communication_types_mod
Contains the types used for communication, holding the state of communications and supporting activit...
Definition: communicationtypes.F90:5

pencil_fft_mod::finalise_pencil_fft
subroutine, public finalise_pencil_fft(monc_communicator)
Cleans up allocated buffer memory.
Definition: pencilfft.F90:93

logging_mod
Logging utility.
Definition: logging.F90:2

fftsolver_mod
Pressure solver which uses a tridiagonal algorithm operating on the pressure terms in Fourier space...
Definition: fftsolver.F90:3

fftsolver_mod::halo_swap_state
type(halo_communication_type), save halo_swap_state
Definition: fftsolver.F90:25

datadefn_mod::default_precision
integer, parameter, public default_precision
MPI communication type which we use for the prognostic and calculation data.
Definition: datadefn.F90:17

grids_mod::z_index
integer, parameter, public z_index
Grid index parameters.
Definition: grids.F90:14

fftsolver_mod::complete_psrce_calculation
subroutine complete_psrce_calculation(current_state, y_halo_size, x_halo_size)
Completes the psrce calculation by waiting on all outstanding psrce communications to complete and th...
Definition: fftsolver.F90:145

fftsolver_mod::initialisation_callback
subroutine initialisation_callback(current_state)
This initialisation callback sets up the pencil fft module, allocates data for the fourier space pres...
Definition: fftsolver.F90:43

datadefn_mod
Contains common definitions for the data and datatypes used by MONC.
Definition: datadefn.F90:2

state_mod::model_state_type
The ModelState which represents the current state of a run.
Definition: state.F90:39

registry_mod::is_component_enabled
logical function, public is_component_enabled(options_database, component_name)
Determines whether or not a specific component is registered and enabled.
Definition: registry.F90:334

logging_mod::log_master_log
subroutine, public log_master_log(level, message)
Will log just from the master process.
Definition: logging.F90:47

monc_component_mod::component_descriptor_type
Description of a component.
Definition: monc_component.F90:42

halo_communication_mod::copy_buffer_to_field
subroutine, public copy_buffer_to_field(local_grid, halo_buffer, field_data, dim, target_index, halo_page)
Copies the received buffer for a specific field to the corresponding halo data of that prognostic fie...
Definition: halocommunication.F90:401

pencil_fft_mod::perform_forward_3dfft
subroutine, public perform_forward_3dfft(current_state, source_data, target_data)
Performs a forward 3D FFT and currently results in target data which is the X, Z, Y oriented pencil N...
Definition: pencilfft.F90:115

fftsolver_mod::pi
real(kind=default_precision) pi
Definition: fftsolver.F90:22

pencil_fft_mod::initialise_pencil_fft
integer function, dimension(3), public initialise_pencil_fft(current_state, my_y_start, my_x_start)
Initialises the pencil FFT functionality, this will create the transposition structures needed...
Definition: pencilfft.F90:52

communication_types_mod::halo_communication_type
Maintains the state of a halo swap and contains buffers, neighbours etc.
Definition: communicationtypes.F90:28

halo_communication_mod::get_single_field_per_halo_cell
integer function, public get_single_field_per_halo_cell(current_state)
A very common function, which returns a single field per halo cell which is used to halo swap just on...
Definition: halocommunication.F90:1230

monc_component_mod
Interfaces and types that MONC components must specify.
Definition: monc_component.F90:6

fftsolver_mod::copy_p_to_halo_buffer
subroutine copy_p_to_halo_buffer(current_state, neighbour_description, dim, source_index, pid_location, current_page, source_data)
Copies the p field data to halo buffers for a specific process in a dimension and halo cell...
Definition: fftsolver.F90:250

halo_communication_mod
Provides the mechanism for halo swapping. This module contains the functionality required to determin...
Definition: halocommunication.F90:8

pencil_fft_mod::perform_backwards_3dfft
subroutine, public perform_backwards_3dfft(current_state, source_data, target_data)
Performs a backwards 3D FFT and currently results in target data which is the X, Z, Y oriented pencil. Note that the source_data here takes no account of the halo; it is up to the caller to exclude this. This does no FFT in Z, but transposes to Y, does an FFT in Y, then transposes to X and performs an FFT in that dimension. Pencil decomposition is used, which has already been set up.
Definition: pencilfft.F90:138

communication_types_mod::neighbour_description_type
Describes the neighbours of a process in a specific dimension and contains the communication buffers ...
Definition: communicationtypes.F90:20

halo_communication_mod::copy_field_to_buffer
subroutine, public copy_field_to_buffer(local_grid, halo_buffer, field_data, dim, source_index, halo_page)
Copies prognostic field data to send buffer for specific field, dimension, halo cell.
Definition: halocommunication.F90:433

fftsolver_mod::fourier_space_sizes
integer, dimension(3) fourier_space_sizes
Definition: fftsolver.F90:24

communication_types_mod::field_data_wrapper_type
Definition: communicationtypes.F90:14

pencil_fft_mod
This Pencil FFT performs 3D forward and backwards FFTs using pencil decomposition. It uses FFTW for the actual FFT kernel and this module contains all the data decomposition around this. There is no FFT required in Z, so this performs FFTs in Y and X (in that order forward and reversed backwards.) The data decomposition is the complex aspect, there is the concept of forward and backwards transformations. Forward transformations will go from pencil Z to Y to X and the backwards transformations undo these, so go from X to Y to Z. Note that we use quite a lot of buffer space here, this could be cut down if Y=X dimensions so some optimisation on memory could be done there in that case.
Definition: pencilfft.F90:8

grids_mod
Functionality to support the different types of grid and abstraction between global grids and local o...
Definition: grids.F90:5

fftsolver_mod::timestep_callback
subroutine timestep_callback(current_state)
Timestep call back, which will transform to Fourier space, do a tridiagonal solve and then back into ...
Definition: fftsolver.F90:87

halo_communication_mod::finalise_halo_communication
subroutine, public finalise_halo_communication(halo_swap_state)
Finalises the halo swap represented by the state by freeing up all the allocated memory.
Definition: halocommunication.F90:340

fftsolver_mod::pt
real(kind=default_precision), dimension(:,:,:), allocatable pt
Definition: fftsolver.F90:23

fftsolver_mod::fftsolver_get_descriptor
type(component_descriptor_type) function, public fftsolver_get_descriptor()
Descriptor of this component for registration.
Definition: fftsolver.F90:33

fftsolver_mod::copy_halo_buffer_to_p
subroutine copy_halo_buffer_to_p(current_state, neighbour_description, dim, target_index, neighbour_location, current_page, source_data)
Definition: fftsolver.F90:269

state_mod
The model state which represents the current state of a run.
Definition: state.F90:2

fftsolver_mod::finalisation_callback
subroutine finalisation_callback(current_state)
Called at MONC finalisation, will call to the pencil fft module to clean itself up and free the press...
Definition: fftsolver.F90:131

fftsolver_mod::cos_x
real(kind=default_precision), dimension(:), allocatable cos_x
Definition: fftsolver.F90:21

grids_mod::y_index
integer, parameter, public y_index
Definition: grids.F90:14

grids_mod::x_index
integer, parameter, public x_index
Definition: grids.F90:14

fftsolver_mod::cos_y
real(kind=default_precision), dimension(:), allocatable cos_y
Definition: fftsolver.F90:21

registry_mod
MONC component registry.
Definition: registry.F90:5