main/doxygen_doc/current_8F90_source.html

!! Copyright (C) 2008-2019 X. Andrade, F. Bonafe, R. Jestaedt, H. Appel

!!

!! This program is free software; you can redistribute it and/or modify

!! it under the terms of the GNU General Public License as published by

!! the Free Software Foundation; either version 2, or (at your option)

!! any later version.

!!

!! This program is distributed in the hope that it will be useful,

!! but WITHOUT ANY WARRANTY; without even the implied warranty of

!! MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

!! GNU General Public License for more details.

!!

!! You should have received a copy of the GNU General Public License

!! along with this program; if not, write to the Free Software

!! Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA

!! 02110-1301, USA.

!!


#include "global.h"


module current_oct_m

  use accel_oct_m

  use batch_oct_m

  use batch_ops_oct_m

  use boundaries_oct_m

  use comm_oct_m

  use debug_oct_m

  use derivatives_oct_m

  use electron_space_oct_m

  use exchange_operator_oct_m

  use global_oct_m

  use grid_oct_m

  use hamiltonian_elec_oct_m

  use, intrinsic :: iso_fortran_env

  use ks_potential_oct_m

  use lalg_basic_oct_m

  use lda_u_oct_m

  use math_oct_m

  use magnetic_oct_m

  use mesh_function_oct_m

  use mesh_oct_m

  use messages_oct_m

  use namespace_oct_m

  use nonlocal_pseudopotential_oct_m

  use parser_oct_m

  use profiling_oct_m

  use projector_oct_m

  use scissor_oct_m

  use space_oct_m

  use states_elec_oct_m

  use states_elec_parallel_oct_m

  use types_oct_m

  use unit_oct_m

  use unit_system_oct_m

  use varinfo_oct_m

  use wfs_elec_oct_m

  use xc_oct_m


  implicit none


  private


  !> Settings that control how the electronic current density is evaluated.
  !! Both components are filled in by current_init.
  type :: current_t
    private
    integer :: method          !< value of the CurrentDensity input variable (one of the method constants of this module)
    logical :: include_diamag  !< value of CalculateDiamagneticCurrent; if true, current_calculate adds st%current_dia
  end type current_t


  public ::                               &

    current_t,                            &

    current_init,                         &

    current_calculate,                    &

    current_calculate_mag,                &

    current_heat_calculate,               &

    current_calculate_mel


  ! Values accepted by the CurrentDensity input variable (stored in current_t%method).
  ! The numbers match the option list documented in current_init.
  integer, parameter, public ::           &

    CURRENT_GRADIENT           = 1,       & ! option "gradient": current from the gradient operator only

    current_gradient_corr      = 2,       & ! option "gradient_corrected": gradient plus corrections from non-local operators

    current_hamiltonian        = 3          ! option "hamiltonian": commutator of the Hamiltonian with the position operator


contains


  !> Read the input options that control the current-density calculation.
  !!
  !! Fills this%method from the CurrentDensity variable (default gradient_corrected) and
  !! this%include_diamag from CalculateDiamagneticCurrent (default no). A value of
  !! CurrentDensity rejected by varinfo_valid_option is reported through
  !! messages_input_error, and any method other than gradient_corrected is announced
  !! through messages_experimental.
  !!
  !! NOTE(review): the math markup in the CalculateDiamagneticCurrent description below
  !! contains a stray dollar sign before the closing math tag. The variable blocks are kept
  !! verbatim here; confirm and clean up separately.
  subroutine current_init(this, namespace)
    type(current_t),   intent(out)   :: this
    type(namespace_t), intent(in)    :: namespace

    push_sub(current_init)

    !%Variable CurrentDensity
    !%Default gradient_corrected
    !%Type integer
    !%Section Hamiltonian
    !%Description
    !% This variable selects the method used to
    !% calculate the current density. For the moment this variable is
    !% for development purposes and users should not need to use
    !% it.
    !%Option gradient 1
    !% The calculation of current is done using the gradient operator. (Experimental)
    !%Option gradient_corrected 2
    !% The calculation of current is done using the gradient operator
    !% with additional corrections for the total current from non-local operators.
    !%Option hamiltonian 3
    !% The current density is obtained from the commutator of the
    !% Hamiltonian with the position operator. (Experimental)
    !%End

    call parse_variable(namespace, 'CurrentDensity', current_gradient_corr, this%method)

    ! Reject values that are not one of the documented options.
    if (.not. varinfo_valid_option('CurrentDensity', this%method)) then
      call messages_input_error(namespace, 'CurrentDensity')
    end if

    ! Only the default method is considered production ready.
    if (this%method /= current_gradient_corr) call messages_experimental("CurrentDensity /= gradient_corrected")

    !%Variable CalculateDiamagneticCurrent
    !%Default no
    !%Type logical
    !%Section Hamiltonian
    !%Description
    !% This variable decides whether the current density arising from the non-uniform
    !% vector potential, defined as:
    !% <math> \vec{J}_{dmc}(\vec{r}, t)=-\frac{e^2}{m_e c_0} n(\vec{r}, t) \vec{A}(\vec{r},t)$ </math>
    !% is included in the total current density.
    !%End
    call parse_variable(namespace, 'CalculateDiamagneticCurrent', .false., this%include_diamag)

    pop_sub(current_init)
  end subroutine current_init


  ! ---------------------------------------------------------


  !> Accumulate the current contribution of one batch of states.
  !!
  !! For every state of block ib at k-point ik the quantity
  !!   ww * aimag(conjg(psi) * gpsi),   ww = st%kweights(ik)*st%occ(ist, ik)
  !! is added to the stored current, where psi comes from psib and gpsi from gpsib(idir).
  !!
  !! Three code paths exist:
  !!  - spinors, or device-packed batches when der%dim /= 3: states are extracted one by one
  !!    with batch_get_state. Non-spinor results go to st%current_kpt(:, idir, ik), spinor
  !!    results go to the four components of st%current_para(:, idir, 1:4).
  !!  - device-packed batches with der%dim == 3: the current_accumulate kernel is run and its
  !!    output is added to st%current_kpt(:, :, ik).
  !!  - host batches: the packed (zff_pack) or unpacked (zff) storage is read directly and
  !!    st%current_kpt(:, idir, ik) is updated.
  !!
  !! \param st     states; provides weights and occupations and receives the accumulated current
  !! \param der    derivatives object; only its mesh and dimension are read here
  !! \param ik     k-point index
  !! \param ib     block index of the batch inside st%group
  !! \param psib   batch of wave functions
  !! \param gpsib  one batch per spatial direction, combined with psib as shown above
  subroutine current_batch_accumulate(st, der, ik, ib, psib, gpsib)
    type(states_elec_t), intent(inout) :: st
    type(derivatives_t), intent(inout) :: der
    integer,             intent(in)    :: ik
    integer,             intent(in)    :: ib
    type(wfs_elec_t),    intent(in)    :: psib
    class(wfs_elec_t),   intent(in)    :: gpsib(:)

    integer :: ist, idir, ii, ip, idim, bsize, gsize
    complex(real64), allocatable :: psi(:, :), gpsi(:, :)
    real(real64), allocatable :: current_tmp(:, :)
    complex(real64) :: c_tmp
    real(real64) :: ww
    real(real64), allocatable :: weight(:)
    type(accel_mem_t) :: buff_weight, buff_current
    type(accel_kernel_t), save :: kernel

    if (st%d%ispin == spinors .or. (psib%status() == batch_device_packed .and. der%dim /= 3)) then

      ! Scratch copies of a single state; only this branch needs them, so they are
      ! allocated here instead of on every call.
      safe_allocate(psi(1:der%mesh%np_part, 1:st%d%dim))
      safe_allocate(gpsi(1:der%mesh%np_part, 1:st%d%dim))

      do idir = 1, der%dim
        do ist = states_elec_block_min(st, ib), states_elec_block_max(st, ib)

          ww = st%kweights(ik)*st%occ(ist, ik)
          ! states with negligible weight do not contribute
          if (abs(ww) <= m_epsilon) cycle

          do idim = 1, st%d%dim
            ii = st%group%psib(ib, ik)%inv_index((/ist, idim/))
            call batch_get_state(psib, ii, der%mesh%np, psi(:, idim))
            call batch_get_state(gpsib(idir), ii, der%mesh%np, gpsi(:, idim))
          end do

          if (st%d%ispin /= spinors) then
            !$omp parallel do
            do ip = 1, der%mesh%np
              st%current_kpt(ip, idir, ik) = st%current_kpt(ip, idir, ik) + ww*aimag(conjg(psi(ip, 1))*gpsi(ip, 1))
            end do
            !$omp end parallel do
          else
            ! Spinors: components 1 and 2 hold the two diagonal terms, components 3 and 4
            ! are built from the mixed product c_tmp.
            !$omp parallel do private(c_tmp)
            do ip = 1, der%mesh%np
              st%current_para(ip, idir, 1) = st%current_para(ip, idir, 1) + ww*aimag(conjg(psi(ip, 1))*gpsi(ip, 1))
              st%current_para(ip, idir, 2) = st%current_para(ip, idir, 2) + ww*aimag(conjg(psi(ip, 2))*gpsi(ip, 2))
              c_tmp = -m_half*(conjg(psi(ip, 2))*gpsi(ip, 1) - psi(ip, 1)*conjg(gpsi(ip, 2)))
              st%current_para(ip, idir, 3) = st%current_para(ip, idir, 3) - ww*aimag(c_tmp)
              st%current_para(ip, idir, 4) = st%current_para(ip, idir, 4) + ww*real(c_tmp, real64)
            end do
            !$omp end parallel do
          end if

        end do
      end do

      safe_deallocate_a(psi)
      safe_deallocate_a(gpsi)

    else if (psib%status() == batch_device_packed) then

      ! The output buffer below is sized for exactly three directions.
      assert(der%dim == 3)

      ! One weight per state of the batch, uploaded to the device.
      safe_allocate(weight(1:psib%nst))
      do ist = 1, psib%nst
        weight(ist) = st%kweights(ik)*st%occ(psib%ist(ist), ik)
      end do

      call accel_create_buffer(buff_weight, accel_mem_read_only, type_float, psib%nst)
      call accel_write_buffer(buff_weight, psib%nst, weight, async=.true.)

      call accel_create_buffer(buff_current, accel_mem_write_only, type_float, der%mesh%np*3)

      call accel_kernel_start_call(kernel, 'density.cu', 'current_accumulate')

      call accel_set_kernel_arg(kernel, 0, psib%nst)
      call accel_set_kernel_arg(kernel, 1, der%mesh%np)
      call accel_set_kernel_arg(kernel, 2, buff_weight)
      call accel_set_kernel_arg(kernel, 3, psib%ff_device)
      call accel_set_kernel_arg(kernel, 4, log2(int(psib%pack_size(1), int32)))
      call accel_set_kernel_arg(kernel, 5, gpsib(1)%ff_device)
      call accel_set_kernel_arg(kernel, 6, gpsib(2)%ff_device)
      call accel_set_kernel_arg(kernel, 7, gpsib(3)%ff_device)
      call accel_set_kernel_arg(kernel, 8, log2(int(gpsib(1)%pack_size(1), int32)))
      call accel_set_kernel_arg(kernel, 9, buff_current)

      ! Compute the grid size
      bsize = accel_kernel_block_size(kernel)
      call accel_grid_size(der%mesh%np, bsize, gsize)

      call accel_kernel_run(kernel, (/gsize/), (/bsize/))

      ! Bring the result back to the host and add it to the k-point resolved current.
      safe_allocate(current_tmp(1:der%mesh%np, 1:der%dim))

      call accel_read_buffer(buff_current, der%mesh%np, der%dim, current_tmp)

      call lalg_axpy(der%mesh%np, der%dim, m_one, current_tmp, st%current_kpt(:,:,ik))

      safe_deallocate_a(current_tmp)

      call accel_free_buffer(buff_weight)
      call accel_free_buffer(buff_current)

      safe_deallocate_a(weight)

    else

      ! Both batches are indexed with the same layout below.
      assert(psib%is_packed() .eqv. gpsib(1)%is_packed())

      !$omp parallel private(ip, ist, ww, idir)
      do ii = 1, psib%nst
        ist = states_elec_block_min(st, ib) + ii - 1
        ww = st%kweights(ik)*st%occ(ist, ik)
        if (abs(ww) <= m_epsilon) cycle

        if (psib%is_packed()) then
          do idir = 1, der%dim
            !$omp do
            do ip = 1, der%mesh%np
              st%current_kpt(ip, idir, ik) = st%current_kpt(ip, idir, ik) &
                + ww*aimag(conjg(psib%zff_pack(ii, ip))*gpsib(idir)%zff_pack(ii, ip))
            end do
            !$omp end do nowait
          end do
        else
          do idir = 1, der%dim
            !$omp do
            do ip = 1, der%mesh%np
              st%current_kpt(ip, idir, ik) = st%current_kpt(ip, idir, ik) &
                + ww*aimag(conjg(psib%zff(ip, 1, ii))*gpsib(idir)%zff(ip, 1, ii))
            end do
            !$omp end do nowait
          end do
        end if
      end do
      !$omp end parallel

    end if

  end subroutine current_batch_accumulate


  ! ---------------------------------------------------------

  !> Compute the total current density st%current.
  !!
  !! The paramagnetic part is evaluated by current_calculate_para and stored in
  !! st%current_para. If this%include_diamag is set, the diamagnetic part from
  !! current_calculate_dia_non_unif_vec_pot (st%current_dia) is added on top.
  subroutine current_calculate(this, namespace, gr, hm, space, st)
    type(current_t),          intent(in)    :: this
    type(namespace_t),        intent(in)    :: namespace
    type(grid_t),             intent(inout) :: gr
    type(hamiltonian_elec_t), intent(inout) :: hm
    class(space_t),           intent(in)    :: space
    type(states_elec_t),      intent(inout) :: st

    call profiling_in("CURRENT_TOTAL")
    push_sub(current_calculate)

    call current_calculate_para(this, namespace, gr, hm, space, st)

    if (this%include_diamag) then
      ! paramagnetic plus diamagnetic contribution
      call current_calculate_dia_non_unif_vec_pot(gr%der, hm, st)
      st%current = st%current_para + st%current_dia
    else
      ! paramagnetic contribution only
      st%current = st%current_para
    end if

    call profiling_out("CURRENT_TOTAL")
    pop_sub(current_calculate)

  end subroutine current_calculate


  ! ---------------------------------------------------------

  !> Diamagnetic current density from the non-uniform vector potential.
  !!
  !! st%current_dia is reset to zero. If hm%hm_base%vector_potential is allocated, the
  !! product st%rho(ip, ispin)*vector_potential(idir, ip) is then added for every spin
  !! channel, direction and mesh point 1..der%mesh%np. Without a vector potential the
  !! result stays zero.
  subroutine current_calculate_dia_non_unif_vec_pot(der, hm, st)
    type(derivatives_t),      intent(inout) :: der
    type(hamiltonian_elec_t), intent(in)    :: hm
    type(states_elec_t),      intent(inout) :: st

    integer :: ip, idir, ispin

    call profiling_in("CURRENT_DIA_NON_UNIF_A")
    push_sub(current_calculate_dia_non_unif_vec_pot)

    st%current_dia = m_zero

    with_vector_potential: if (allocated(hm%hm_base%vector_potential)) then
      do ispin = 1, st%d%nspin
        do idir = 1, der%dim
          !$omp parallel do
          do ip = 1, der%mesh%np
            ! the vector potential is assumed to be divided by c_0 already;
            ! note that it is stored as (direction, point)
            st%current_dia(ip, idir, ispin) = st%current_dia(ip, idir, ispin) + &
              st%rho(ip, ispin)*hm%hm_base%vector_potential(idir, ip)
          end do
          !$omp end parallel do
        end do
      end do
    end if with_vector_potential

    call profiling_out("CURRENT_DIA_NON_UNIF_A")
    pop_sub(current_calculate_dia_non_unif_vec_pot)

  end subroutine current_calculate_dia_non_unif_vec_pot


  ! ---------------------------------------------------------

  !> Compute the magnetization current st%current_mag.
  !!
  !! st%current_mag is reset to zero. For spin-polarized and spinor calculations
  !! (st%d%ispin /= unpolarized) one half of the curl of the magnetization density
  !! returned by magnetic_density is added to the first component, st%current_mag(:, :, 1).
  subroutine current_calculate_mag(der, st)
    type(derivatives_t),      intent(inout) :: der
    type(states_elec_t),      intent(inout) :: st

    real(real64), allocatable :: mag_dens(:, :), curl_mag_dens(:, :)

    call profiling_in("CURRENT_MAG")
    push_sub(current_calculate_mag)

    st%current_mag = m_zero

    if (st%d%ispin /= unpolarized) then
      ! Work arrays span np_part points, the curl is only accumulated on np points.
      safe_allocate(mag_dens(1:der%mesh%np_part, 1:der%dim))
      safe_allocate(curl_mag_dens(1:der%mesh%np_part, 1:der%dim))

      call magnetic_density(der%mesh, st%d, st%rho, mag_dens)
      call dderivatives_curl(der, mag_dens, curl_mag_dens)

      ! current_mag(:, :, 1) <- current_mag(:, :, 1) + 1/2 * curl(m)
      call lalg_axpy(der%mesh%np, der%dim, m_half, curl_mag_dens, st%current_mag(:, :, 1))

      safe_deallocate_a(mag_dens)
      safe_deallocate_a(curl_mag_dens)
    end if

    call profiling_out("CURRENT_MAG")
    pop_sub(current_calculate_mag)

  end subroutine current_calculate_mag


  ! ---------------------------------------------------------

  !> Compute the paramagnetic current density st%current_para.
  !!
  !! st%current_kpt and st%current_para are zeroed on the np mesh points and then filled
  !! according to this%method:
  !!  - current_hamiltonian: for every batch the Hamiltonian is applied to psi and to
  !!    x_idir*psi, and the current is built from the difference of H(x psi) and x(H psi).
  !!  - current_gradient and current_gradient_corr: the current is built from
  !!    aimag(conjg(psi)*grad psi). For current_gradient_corr the gradient is corrected
  !!    by the position commutators of the non-local terms. When the conditions tested
  !!    below hold, whole batches are processed through current_batch_accumulate;
  !!    otherwise states are processed one by one.
  !!
  !! For non-spinor calculations the k-point resolved current st%current_kpt is summed
  !! into st%current_para afterwards. The result is reduced over states and k-points when
  !! these are parallelized, and symmetrized if st%symmetrize_density is set.
  !!
  !! States whose weight st%kweights(ik)*st%occ(ist, ik) is below m_epsilon in absolute
  !! value are skipped in all state-by-state loops.
  subroutine current_calculate_para(this, namespace, gr, hm, space, st)
    type(current_t),             intent(in)    :: this
    type(namespace_t),           intent(in)    :: namespace
    type(grid_t),                intent(inout) :: gr
    type(hamiltonian_elec_t),    intent(inout) :: hm
    class(space_t),              intent(in)    :: space
    type(states_elec_t), target, intent(inout) :: st

    integer :: ik, ist, idir, idim, ip, ib, ii, ispin
    complex(real64), allocatable :: gpsi(:, :, :), psi(:, :), rhpsi(:, :), hrpsi(:, :)
    type(wfs_elec_t) :: hpsib, rhpsib, rpsib, hrpsib, epsib
    class(wfs_elec_t), allocatable :: commpsib(:)
    real(real64) :: ww
    complex(real64) :: c_tmp

    call profiling_in("CURRENT_PARA")
    push_sub(current_calculate_para)

    ! spin not implemented or tested
    assert(all(ubound(st%current_para) == (/gr%np_part, gr%der%dim, st%d%nspin/)))
    assert(all(ubound(st%current_kpt) == (/gr%np, gr%der%dim, st%d%kpt%end/)))
    assert(all(lbound(st%current_kpt) == (/1, 1, st%d%kpt%start/)))

    safe_allocate(psi(1:gr%np_part, 1:st%d%dim))
    safe_allocate(gpsi(1:gr%np, 1:gr%der%dim, 1:st%d%dim))
    safe_allocate(rhpsi(1:gr%np_part, 1:st%d%dim))
    safe_allocate(hrpsi(1:gr%np_part, 1:st%d%dim))
    safe_allocate_type_array(wfs_elec_t, commpsib, (1:gr%der%dim))

    ! Reset both accumulators on the inner mesh points.
    !$omp parallel private(idir, ip, ispin)
    do ik = st%d%kpt%start, st%d%kpt%end
      do idir = 1, gr%der%dim
        !$omp do
        do ip = 1, gr%np
          st%current_kpt(ip, idir, ik) = m_zero
        end do
        !$omp end do nowait
      end do
    end do
    do ispin = 1, st%d%nspin
      do idir = 1, gr%der%dim
        !$omp do
        do ip = 1, gr%np
          st%current_para(ip, idir, ispin) = m_zero
        end do
        !$omp end do nowait
      end do
    end do
    !$omp end parallel

    select case (this%method)

    case (current_hamiltonian)
      ! For hybrid functionals without ACE the exchange operator needs access to the states.
      if (family_is_hybrid(hm%xc)) then
        if (.not. hm%exxop%useACE) then
          hm%exxop%st => st
          call states_elec_parallel_remote_access_start(hm%exxop%st)
        end if
      end if

      do ik = st%d%kpt%start, st%d%kpt%end
        ispin = st%d%get_spin_index(ik)
        do ib = st%group%block_start, st%group%block_end

          call st%group%psib(ib, ik)%do_pack(copy = .true.)

          ! work batches with the same layout as the state batch
          call st%group%psib(ib, ik)%copy_to(hpsib)
          call st%group%psib(ib, ik)%copy_to(rhpsib)
          call st%group%psib(ib, ik)%copy_to(rpsib)
          call st%group%psib(ib, ik)%copy_to(hrpsib)

          call boundaries_set(gr%der%boundaries, gr, st%group%psib(ib, ik))
          call zhamiltonian_elec_apply_batch(hm, namespace, gr, st%group%psib(ib, ik), hpsib, set_bc = .false.)

          do idir = 1, gr%der%dim

            ! rhpsib = x_idir * (H psi),  rpsib = x_idir * psi,  hrpsib = H (x_idir * psi)
            call batch_mul(gr%np, gr%x_t(:, idir), hpsib, rhpsib)
            call batch_mul(gr%np_part, gr%x_t(:, idir), st%group%psib(ib, ik), rpsib)

            call zhamiltonian_elec_apply_batch(hm, namespace, gr, rpsib, hrpsib, set_bc = .false.)

            do ist = states_elec_block_min(st, ib), states_elec_block_max(st, ib)
              ww = st%kweights(ik)*st%occ(ist, ik)
              ! same negligible-weight test as in the gradient-based branches
              if (abs(ww) <= m_epsilon) cycle

              do idim = 1, st%d%dim
                ii = st%group%psib(ib, ik)%inv_index((/ist, idim/))
                call batch_get_state(st%group%psib(ib, ik), ii, gr%np, psi(:, idim))
                call batch_get_state(hrpsib, ii, gr%np, hrpsi(:, idim))
                call batch_get_state(rhpsib, ii, gr%np, rhpsi(:, idim))
              end do

              if (st%d%ispin /= spinors) then
                !$omp parallel do
                do ip = 1, gr%np
                  st%current_kpt(ip, idir, ik) = st%current_kpt(ip, idir, ik) &
                    - ww*aimag(conjg(psi(ip, 1))*hrpsi(ip, 1) - conjg(psi(ip, 1))*rhpsi(ip, 1))
                end do
                !$omp end parallel do
              else
                ! NOTE(review): components 1 and 2 are accumulated with a plus sign here,
                ! while the non-spinor expression above uses a minus sign. In addition the
                ! last term of c_tmp enters with a minus sign, whereas the gradient-based
                ! formula with gpsi replaced by (hrpsi - rhpsi) would give a plus sign.
                ! Both are kept unchanged; confirm the intended signs.
                !$omp parallel do  private(c_tmp)
                do ip = 1, gr%np
                  st%current_para(ip, idir, 1) = st%current_para(ip, idir, 1) + &
                    ww*aimag(conjg(psi(ip, 1))*hrpsi(ip, 1) - conjg(psi(ip, 1))*rhpsi(ip, 1))
                  st%current_para(ip, idir, 2) = st%current_para(ip, idir, 2) + &
                    ww*aimag(conjg(psi(ip, 2))*hrpsi(ip, 2) - conjg(psi(ip, 2))*rhpsi(ip, 2))
                  c_tmp = -m_half*m_zi*(conjg(psi(ip, 2))*hrpsi(ip, 1) - conjg(psi(ip, 2))*rhpsi(ip, 1) &
                    -psi(ip, 1)*conjg(hrpsi(ip, 2)) - psi(ip, 1)*conjg(rhpsi(ip, 2)))
                  st%current_para(ip, idir, 3) = st%current_para(ip, idir, 3) + ww*real(c_tmp, real64)
                  st%current_para(ip, idir, 4) = st%current_para(ip, idir, 4) + ww*aimag(c_tmp)
                end do
                !$omp end parallel do
              end if

            end do

          end do

          ! the states were not modified, so nothing needs to be copied back
          call st%group%psib(ib, ik)%do_unpack(copy = .false.)

          call hpsib%end()
          call rhpsib%end()
          call rpsib%end()
          call hrpsib%end()

        end do
      end do

      if (family_is_hybrid(hm%xc)) then
        if (.not. hm%exxop%useACE) then
          call states_elec_parallel_remote_access_stop(hm%exxop%st)
          nullify(hm%exxop%st)
        end if
      end if

    case (current_gradient, current_gradient_corr)

      if (this%method == current_gradient_corr .and. .not. family_is_mgga_with_exc(hm%xc) &
        .and. hm%theory_level /= hartree_fock &
        .and. hm%theory_level /= generalized_kohn_sham_dft &
        .and. hm%theory_level /= rdmft &
        .and. hm%vnl%apply_projector_matrices) then

        ! we can use the packed version

        do ik = st%d%kpt%start, st%d%kpt%end
          ispin = st%d%get_spin_index(ik)
          do ib = st%group%block_start, st%group%block_end

            ! copy st%group%psib(ib, ik) to epsib and set the phase
            call hm%phase%copy_and_set_phase(gr, st%d%kpt, st%group%psib(ib, ik), epsib)

            ! this now takes non-orthogonal axis into account
            call zderivatives_batch_grad(gr%der, epsib, commpsib, set_bc=.false.)

            ! add the position commutators of the non-local pseudopotential and of DFT+U
            call hm%vnl%zposition_commutator(gr, st%d, gr%der%boundaries%spiral, epsib, commpsib, async=.true.)

            call zlda_u_commute_r(hm%lda_u, gr, space, st%d, namespace, epsib, commpsib)

            call current_batch_accumulate(st, gr%der, ik, ib, epsib, commpsib)

            do idir = 1, gr%der%dim
              call commpsib(idir)%end()
            end do

            call epsib%end()

            call accel_finish()
          end do
        end do

      else

        ! use the slow non-packed version

        do ik = st%d%kpt%start, st%d%kpt%end
          ispin = st%d%get_spin_index(ik)
          do ist = st%st_start, st%st_end

            ww = st%kweights(ik)*st%occ(ist, ik)
            if (abs(ww) <= m_epsilon) cycle

            call states_elec_get_state(st, gr, ist, ik, psi)

            if (hm%phase%is_allocated()) then
              call hm%phase%apply_to_single(psi, gr%np, st%d%dim, ik, .false.)
              ! apply phase correction while setting boundary -> memory needs to be
              ! accessed only once
              do idim = 1, st%d%dim
                call boundaries_set(gr%der%boundaries, gr, psi(:, idim), phase_correction = hm%phase%phase_corr(:, ik), &
                  buff_phase_corr = hm%phase%buff_phase_corr, offset=int((ik-st%d%kpt%start)*(gr%np_part-gr%np)))
              end do
            else
              do idim = 1, st%d%dim
                call boundaries_set(gr%der%boundaries, gr, psi(:, idim))
              end do
            end if

            do idim = 1, st%d%dim
              call zderivatives_grad(gr%der, psi(:, idim), gpsi(:, :, idim), set_bc = .false.)
            end do

            if (this%method == current_gradient_corr) then
              !A nonlocal contribution from the MGGA potential must be included
              !This must be done first, as this is like a position-dependent mass
              call hm%ks_pot%zcurrent_mass_renormalization(gpsi, gr%der%dim, st%d%dim, ispin)

              !A nonlocal contribution from the pseudopotential must be included
              call zprojector_commute_r_allatoms_alldir(hm%ep%proj, hm%ions, gr, st%d%dim, &
                gr%der%boundaries, ik, psi, gpsi)
              !A nonlocal contribution from the scissor must be included
              if (hm%scissor%apply) then
                call scissor_commute_r(hm%scissor, gr, ik, psi, gpsi)
              end if

              call zlda_u_commute_r_single(hm%lda_u, gr, space, st%d, namespace, ist, ik, &
                psi, gpsi, hm%phase%is_allocated())

              call zexchange_operator_commute_r(hm%exxop, namespace, gr, st%d, ik, psi, gpsi)

            end if

            if (st%d%ispin /= spinors) then
              do idir = 1, gr%der%dim
                !$omp parallel do
                do ip = 1, gr%np
                  st%current_kpt(ip, idir, ik) = st%current_kpt(ip, idir, ik) + &
                    ww*aimag(conjg(psi(ip, 1))*gpsi(ip, idir, 1))
                end do
                !$omp end parallel do
              end do
            else
              do idir = 1, gr%der%dim
                !$omp parallel do  private(c_tmp)
                do ip = 1, gr%np
                  st%current_para(ip, idir, 1) = st%current_para(ip, idir, 1) + &
                    ww*aimag(conjg(psi(ip, 1))*gpsi(ip, idir, 1))
                  st%current_para(ip, idir, 2) = st%current_para(ip, idir, 2) + &
                    ww*aimag(conjg(psi(ip, 2))*gpsi(ip, idir, 2))
                  c_tmp = -m_half*m_zi*(conjg(psi(ip, 2))*gpsi(ip, idir, 1) - psi(ip, 1)*conjg(gpsi(ip, idir, 2)))
                  st%current_para(ip, idir, 3) = st%current_para(ip, idir, 3) + ww*real(c_tmp, real64)
                  st%current_para(ip, idir, 4) = st%current_para(ip, idir, 4) + ww*aimag(c_tmp)
                end do
                !$omp end parallel do
              end do
            end if

          end do
        end do

      end if

    case default

      ! current_init only accepts the three documented methods
      assert(.false.)

    end select

    if (st%d%ispin /= spinors) then
      !We sum the current over k-points
      do ik = st%d%kpt%start, st%d%kpt%end
        ispin = st%d%get_spin_index(ik)
        call lalg_axpy(gr%np, gr%der%dim, m_one, st%current_kpt(:, :, ik), st%current_para(:, :, ispin))
      end do
    end if

    ! Collect the contributions of the other state and k-point groups.
    if (st%parallel_in_states .or. st%d%kpt%parallel) then
      call comm_allreduce(st%st_kpt_mpi_grp, st%current_para, dim = (/gr%np, gr%der%dim, st%d%nspin/))
    end if

    if (st%symmetrize_density) then
      do ispin = 1, st%d%nspin
        call dgrid_symmetrize_vector_field(gr, st%current_para(:, :, ispin), suppress_warning = .true.)
      end do
    end if

    safe_deallocate_a(gpsi)
    safe_deallocate_a(psi)
    safe_deallocate_a(rhpsi)
    safe_deallocate_a(hrpsi)
    safe_deallocate_a(commpsib)

    call profiling_out("CURRENT_PARA")
    pop_sub(current_calculate_para)

  end subroutine current_calculate_para


  ! ---------------------------------------------------------

  !> Calculate the current matrix element between two states,
  !!   I_{ij}(t) = <i| J(t) |j>
  !!
  !! This is used only in the floquet_observables utility and is highly experimental.
  !!
  !! The result is written to cmel(idir, ispin), with ispin = hm%d%get_spin_index(ik); all
  !! other entries of cmel are set to zero. The contributions of all spinor components
  !! (idim = 1..hm%d%dim) are summed, and the result is reduced over the mesh partition
  !! with der%mesh%allreduce.
  !!
  !! \param der    derivatives object (mesh, boundaries, gradient)
  !! \param hm     Hamiltonian; provides the phase and the non-local terms entering the commutators
  !! \param psi_i  state i, read on the first der%mesh%np points
  !! \param psi_j  state j, read on the first der%mesh%np points
  !! \param ik     k-point index
  !! \param cmel   current vector, documented as cmel(1:der%dim, 1:st%d%nspin)
  subroutine current_calculate_mel(der, hm, psi_i, psi_j, ik,  cmel)
    type(derivatives_t),  intent(inout)    :: der
    type(hamiltonian_elec_t),  intent(in)  :: hm
    complex(real64),      intent(in)       :: psi_i(:,:)
    complex(real64),      intent(in)       :: psi_j(:,:)
    integer,              intent(in)       :: ik
    complex(real64),      intent(out)      :: cmel(:,:) ! the current vector cmel(1:der%dim, 1:st%d%nspin)

    integer ::  idir, idim, ispin
    complex(real64), allocatable :: gpsi_j(:, :, :), ppsi_j(:,:),  gpsi_i(:, :, :), ppsi_i(:,:)

    push_sub(current_calculate_mel)

    safe_allocate(gpsi_i(1:der%mesh%np, 1:der%dim, 1:hm%d%dim))
    safe_allocate(ppsi_i(1:der%mesh%np_part,1:hm%d%dim))
    safe_allocate(gpsi_j(1:der%mesh%np, 1:der%dim, 1:hm%d%dim))
    safe_allocate(ppsi_j(1:der%mesh%np_part,1:hm%d%dim))

    cmel = m_z0

    ispin = hm%d%get_spin_index(ik)

    ! Work copies that extend to the boundary points (np_part).
    ppsi_i(:,:) = m_z0
    ppsi_i(1:der%mesh%np,:) = psi_i(1:der%mesh%np,:)
    ppsi_j(:,:) = m_z0
    ppsi_j(1:der%mesh%np,:) = psi_j(1:der%mesh%np,:)

    do idim = 1, hm%d%dim
      call boundaries_set(der%boundaries, der%mesh, ppsi_i(:, idim))
      call boundaries_set(der%boundaries, der%mesh, ppsi_j(:, idim))
    end do

    if (hm%phase%is_allocated()) then
      ! Apply the phase that contains both the k-point and vector-potential terms.
      call hm%phase%apply_to_single(ppsi_i, der%mesh%np_part, hm%d%dim, ik, .false.)
      call hm%phase%apply_to_single(ppsi_j, der%mesh%np_part, hm%d%dim, ik, .false.)
    end if

    do idim = 1, hm%d%dim
      call zderivatives_grad(der, ppsi_i(:, idim), gpsi_i(:, :, idim), set_bc = .false.)
      call zderivatives_grad(der, ppsi_j(:, idim), gpsi_j(:, :, idim), set_bc = .false.)
    end do

    !A nonlocal contribution from the MGGA potential must be included
    !This must be done first, as this is like a position-dependent mass
    call hm%ks_pot%zcurrent_mass_renormalization(gpsi_i, der%dim, hm%d%dim, ispin)
    call hm%ks_pot%zcurrent_mass_renormalization(gpsi_j, der%dim, hm%d%dim, ispin)

    !A nonlocal contribution from the pseudopotential must be included
    call zprojector_commute_r_allatoms_alldir(hm%ep%proj, hm%ions, der%mesh, hm%d%dim, &
      der%boundaries, ik, ppsi_i, gpsi_i)
    call zprojector_commute_r_allatoms_alldir(hm%ep%proj, hm%ions, der%mesh, hm%d%dim, &
      der%boundaries, ik, ppsi_j, gpsi_j)
    !A nonlocal contribution from the scissor must be included
    if (hm%scissor%apply) then
      call scissor_commute_r(hm%scissor, der%mesh, ik, ppsi_i, gpsi_i)
      call scissor_commute_r(hm%scissor, der%mesh, ik, ppsi_j, gpsi_j)
    end if

    ! NOTE(review): the dot products below use the input states psi_i and psi_j, while the
    ! gradients were computed from the phase-multiplied copies ppsi_i and ppsi_j. When
    ! hm%phase is allocated this mixes phased and unphased functions; confirm whether the
    ! phased copies should be used instead.
    do idir = 1, der%dim

      do idim = 1, hm%d%dim

        ! Accumulate over the spinor components (cmel was zeroed above); assigning here
        ! would keep only the contribution of the last component.
        cmel(idir, ispin) = cmel(idir, ispin) &
          + m_zi * zmf_dotp(der%mesh, psi_i(:, idim), gpsi_j(:, idir, idim), reduce = .false.) &
          - m_zi * zmf_dotp(der%mesh, gpsi_i(:, idir, idim), psi_j(:, idim), reduce = .false.)

      end do
    end do

    ! The dot products were computed without reduction; sum them over the mesh partition once.
    call der%mesh%allreduce(cmel)

    safe_deallocate_a(gpsi_i)
    safe_deallocate_a(ppsi_i)
    safe_deallocate_a(gpsi_j)
    safe_deallocate_a(ppsi_j)

    pop_sub(current_calculate_mel)

  end subroutine current_calculate_mel


  ! ---------------------------------------------------------

  !> Compute the heat current for periodic systems without spinors.
  !!
  !! The output is initialised on the mesh points 1..der%mesh%np with
  !! st%current(ip, :, :)*hm%ep%vpsl(ip). For every state with non-negligible weight a term
  !! built from the first derivatives (gpsi) and second derivatives (g2psi) of the wave
  !! function is then added, scaled by the weight and a factor 1/8.
  !!
  !! Only current(1:der%mesh%np, 1:space%dim, 1:st%d%nspin) is defined on return.
  !! NOTE(review): no reduction over states or k-points is performed in this routine;
  !! presumably the caller takes care of it, confirm.
  !!
  !! \param space    space object; must be periodic, provides the number of dimensions
  !! \param der      derivatives object (mesh, boundaries, gradient)
  !! \param hm       Hamiltonian; provides the phase and the local potential vpsl
  !! \param st       states; st%current must already hold the current density
  !! \param current  resulting heat current
  subroutine current_heat_calculate(space, der, hm, st, current)
    class(space_t),           intent(in)    :: space
    type(derivatives_t),      intent(in)    :: der
    type(hamiltonian_elec_t), intent(in)    :: hm
    type(states_elec_t),      intent(in)    :: st
    real(real64),             intent(out)   :: current(:, :, :)

    integer :: ik, ist, idir, idim, ip, ispin, ndim
    complex(real64), allocatable :: gpsi(:, :, :), psi(:, :), g2psi(:, :, :, :)
    complex(real64) :: tmp
    real(real64) :: ww

    push_sub(current_heat_calculate)

    assert(space%is_periodic())
    assert(st%d%dim == 1)

    ndim = space%dim

    safe_allocate(psi(1:der%mesh%np_part, 1:st%d%dim))
    safe_allocate(gpsi(1:der%mesh%np_part, 1:ndim, 1:st%d%dim))
    safe_allocate(g2psi(1:der%mesh%np, 1:ndim, 1:ndim, 1:st%d%dim))

    do ip = 1, der%mesh%np
      current(ip, 1:ndim, 1:st%d%nspin) = st%current(ip, 1:ndim, 1:st%d%nspin)*hm%ep%vpsl(ip)
    end do

    do ik = st%d%kpt%start, st%d%kpt%end
      ispin = st%d%get_spin_index(ik)
      do ist = st%st_start, st%st_end

        ! weight of this state; negligible weights are skipped
        ww = st%kweights(ik)*st%occ(ist, ik)
        if (abs(ww) <= m_epsilon) cycle

        call states_elec_get_state(st, der%mesh, ist, ik, psi)
        do idim = 1, st%d%dim
          call boundaries_set(der%boundaries, der%mesh, psi(:, idim))
        end do

        if (hm%phase%is_allocated()) then
          call hm%phase%apply_to_single(psi, der%mesh%np_part, st%d%dim, ik, conjugate = .false.)
        end if

        do idim = 1, st%d%dim
          call zderivatives_grad(der, psi(:, idim), gpsi(:, :, idim), set_bc = .false.)
        end do
        do idir = 1, ndim
          ! Remove the phase on the inner points, fill the boundary points, and apply the
          ! phase again on all points before differentiating a second time.
          if (hm%phase%is_allocated()) then
            call hm%phase%apply_to_single(gpsi(:, idir, :), der%mesh%np, st%d%dim, ik, conjugate = .true.)
          end if

          do idim = 1, st%d%dim
            call boundaries_set(der%boundaries, der%mesh, gpsi(:,idir, idim))
          end do

          if (hm%phase%is_allocated()) then
            call hm%phase%apply_to_single(gpsi(:, idir, :), der%mesh%np_part, st%d%dim, ik, conjugate = .false.)
          end if

          do idim = 1, st%d%dim
            call zderivatives_grad(der, gpsi(:, idir, idim), g2psi(:, :, idir, idim), set_bc = .false.)
          end do
        end do
        ! only one spinor component exists (checked at the top of the routine)
        idim = 1
        do ip = 1, der%mesh%np
          do idir = 1, ndim
            tmp = sum(conjg(g2psi(ip, 1:ndim, idir, idim))*gpsi(ip, 1:ndim, idim)) - &
              sum(conjg(gpsi(ip, 1:ndim, idim))*g2psi(ip, 1:ndim, idir, idim))
            tmp = tmp - conjg(gpsi(ip, idir, idim))*sum(g2psi(ip, 1:ndim, 1:ndim, idim)) + &
              sum(conjg(g2psi(ip, 1:ndim, 1:ndim, idim)))*gpsi(ip, idir, idim)
            current(ip, idir, ispin) = current(ip, idir, ispin) + ww*aimag(tmp)/8.0_real64
          end do
        end do
      end do
    end do

    ! Release the work arrays through the same macro used everywhere else in this module.
    safe_deallocate_a(psi)
    safe_deallocate_a(gpsi)
    safe_deallocate_a(g2psi)

    pop_sub(current_heat_calculate)

  end subroutine current_heat_calculate


end module current_oct_m


!! Local Variables:

!! mode: f90

!! coding: utf-8

!! End:

accel_oct_m::accel_create_buffer
Definition: accel.F90:300

accel_oct_m::accel_grid_size
Definition: accel.F90:288

accel_oct_m::accel_kernel_run
Definition: accel.F90:304

accel_oct_m::accel_read_buffer
Definition: accel.F90:337

accel_oct_m::accel_set_kernel_arg
Definition: accel.F90:354

accel_oct_m::accel_write_buffer
Definition: accel.F90:312

batch_ops_oct_m::batch_get_state
Definition: batch_ops.F90:212

batch_ops_oct_m::batch_mul
Definition: batch_ops.F90:233

boundaries_oct_m::boundaries_set
Definition: boundaries.F90:217

comm_oct_m::comm_allreduce
Definition: comm.F90:131

lalg_basic_oct_m::lalg_axpy
constant times a vector plus a vector
Definition: lalg_basic.F90:173

math_oct_m::log2
Definition: math.F90:198

mesh_function_oct_m::zmf_dotp
Definition: mesh_function.F90:191

parser_oct_m::parse_variable
Definition: parser.F90:253

scissor_oct_m::scissor_commute_r
Definition: scissor.F90:157

states_elec_oct_m::states_elec_get_state
Definition: states_elec.F90:338

varinfo_oct_m::varinfo_valid_option
Definition: varinfo.F90:134

accel_oct_m
Definition: accel.F90:120

accel_oct_m::accel_kernel_block_size
integer function, public accel_kernel_block_size(kernel)
Definition: accel.F90:1188

accel_oct_m::accel_free_buffer
subroutine, public accel_free_buffer(this, async)
Definition: accel.F90:1005

accel_oct_m::accel_kernel_start_call
subroutine, public accel_kernel_start_call(this, file_name, kernel_name, flags)
Definition: accel.F90:1413

accel_oct_m::accel_finish
subroutine, public accel_finish()
Definition: accel.F90:1098

accel_oct_m::accel_mem_write_only
integer, parameter, public accel_mem_write_only
Definition: accel.F90:185

accel_oct_m::accel_mem_read_only
integer, parameter, public accel_mem_read_only
Definition: accel.F90:185

batch_oct_m
This module implements batches of mesh functions.
Definition: batch.F90:135

batch_oct_m::batch_device_packed
integer, parameter, public batch_device_packed
functions are stored in device memory in packed order
Definition: batch.F90:286

batch_ops_oct_m
This module implements common operations on batches of mesh functions.
Definition: batch_ops.F90:118

boundaries_oct_m
Module implementing boundary conditions in Octopus.
Definition: boundaries.F90:124

comm_oct_m
Definition: comm.F90:116

current_oct_m
Definition: current.F90:116

current_oct_m::current_batch_accumulate
subroutine current_batch_accumulate(st, der, ik, ib, psib, gpsib)
Definition: current.F90:229

current_oct_m::current_calculate_dia_non_unif_vec_pot
subroutine current_calculate_dia_non_unif_vec_pot(der, hm, st)
Compute diamagnetic current density from non-uniform vector potential (the part coming from the unifo...
Definition: current.F90:401

current_oct_m::current_calculate_mag
subroutine, public current_calculate_mag(der, st)
Compute magnetization current. Note: due to the numerical curl, the magnetization current could de...
Definition: current.F90:436

current_oct_m::current_hamiltonian
integer, parameter, public current_hamiltonian
Definition: current.F90:173

current_oct_m::current_gradient_corr
integer, parameter, public current_gradient_corr
Definition: current.F90:173

current_oct_m::current_heat_calculate
subroutine, public current_heat_calculate(space, der, hm, st, current)
Definition: current.F90:848

current_oct_m::current_calculate_para
subroutine current_calculate_para(this, namespace, gr, hm, space, st)
Compute paramagnetic current density (including full diamagnetic term if method = Hamiltonian is used...
Definition: current.F90:468

current_oct_m::current_calculate_mel
subroutine, public current_calculate_mel(der, hm, psi_i, psi_j, ik, cmel)
Definition: current.F90:766

current_oct_m::current_calculate
subroutine, public current_calculate(this, namespace, gr, hm, space, st)
Compute total electronic current density.
Definition: current.F90:373

current_oct_m::current_init
subroutine, public current_init(this, namespace)
Definition: current.F90:181

debug_oct_m
Definition: debug.F90:116

derivatives_oct_m
This module calculates the derivatives (gradients, Laplacians, etc.) of a function.
Definition: derivatives.F90:123

derivatives_oct_m::dderivatives_curl
subroutine, public dderivatives_curl(der, ff, op_ff, ghost_update, set_bc)
apply the curl operator to a vector of mesh functions
Definition: derivatives.F90:1362

derivatives_oct_m::zderivatives_batch_grad
subroutine, public zderivatives_batch_grad(der, ffb, opffb, ghost_update, set_bc, to_cartesian, factor)
apply the gradient to a batch of mesh functions
Definition: derivatives.F90:2406

derivatives_oct_m::zderivatives_grad
subroutine, public zderivatives_grad(der, ff, op_ff, ghost_update, set_bc, to_cartesian)
apply the gradient to a mesh function
Definition: derivatives.F90:2062

electron_space_oct_m
Definition: electron_space.F90:116

electron_space_oct_m::unpolarized
integer, parameter, public unpolarized
Parameters...
Definition: electron_space.F90:141

electron_space_oct_m::spinors
integer, parameter, public spinors
Definition: electron_space.F90:141

exchange_operator_oct_m
Definition: exchange_operator.F90:116

exchange_operator_oct_m::zexchange_operator_commute_r
subroutine, public zexchange_operator_commute_r(this, namespace, mesh, st_d, ik, psi, gpsi)
Definition: exchange_operator.F90:2702

global_oct_m
Definition: global.F90:116

global_oct_m::m_zero
real(real64), parameter, public m_zero
Definition: global.F90:191

global_oct_m::rdmft
integer, parameter, public rdmft
Definition: global.F90:241

global_oct_m::hartree_fock
integer, parameter, public hartree_fock
Definition: global.F90:241

global_oct_m::m_z0
complex(real64), parameter, public m_z0
Definition: global.F90:201

global_oct_m::generalized_kohn_sham_dft
integer, parameter, public generalized_kohn_sham_dft
Definition: global.F90:241

global_oct_m::m_zi
complex(real64), parameter, public m_zi
Definition: global.F90:205

global_oct_m::m_epsilon
real(real64), parameter, public m_epsilon
Definition: global.F90:207

global_oct_m::m_half
real(real64), parameter, public m_half
Definition: global.F90:197

global_oct_m::m_one
real(real64), parameter, public m_one
Definition: global.F90:192

grid_oct_m
This module implements the underlying real-space grid.
Definition: grid.F90:119

grid_oct_m::dgrid_symmetrize_vector_field
subroutine, public dgrid_symmetrize_vector_field(gr, field, suppress_warning)
Definition: grid.F90:698

hamiltonian_elec_oct_m
Definition: hamiltonian_elec.F90:117

hamiltonian_elec_oct_m::zhamiltonian_elec_apply_batch
subroutine, public zhamiltonian_elec_apply_batch(hm, namespace, mesh, psib, hpsib, terms, set_bc)
Definition: hamiltonian_elec.F90:2564

ks_potential_oct_m
A module to handle KS potential, without the external potential.
Definition: ks_potential.F90:121

lalg_basic_oct_m
Definition: lalg_basic.F90:116

lda_u_oct_m
Definition: lda_u.F90:116

lda_u_oct_m::zlda_u_commute_r
subroutine, public zlda_u_commute_r(this, mesh, space, d, namespace, psib, gpsib)
This routine computes [r,V_lda+u].
Definition: lda_u.F90:5088

lda_u_oct_m::zlda_u_commute_r_single
subroutine, public zlda_u_commute_r_single(this, mesh, space, d, namespace, ist, ik, psi, gpsi, has_phase)
Definition: lda_u.F90:5037

magnetic_oct_m
Definition: magnetic.F90:116

magnetic_oct_m::magnetic_density
subroutine, public magnetic_density(mesh, std, rho, md)
Definition: magnetic.F90:164

math_oct_m
This module is intended to contain "only mathematical" functions and procedures.
Definition: math.F90:117

mesh_function_oct_m
This module defines various routines, operating on mesh functions.
Definition: mesh_function.F90:118

mesh_oct_m
This module defines the meshes, which are used in Octopus.
Definition: mesh.F90:120

messages_oct_m
Definition: messages.F90:117

messages_oct_m::messages_input_error
subroutine, public messages_input_error(namespace, var, details, row, column)
Definition: messages.F90:691

messages_oct_m::messages_experimental
subroutine, public messages_experimental(name, namespace)
Definition: messages.F90:1063

namespace_oct_m
Definition: namespace.F90:105

nonlocal_pseudopotential_oct_m
Definition: nonlocal_pseudopotential.F90:116

parser_oct_m
Definition: parser.F90:116

profiling_oct_m
Definition: profiling.F90:118

profiling_oct_m::profiling_out
subroutine, public profiling_out(label)
Increment out counter and sum up difference between entry and exit time.
Definition: profiling.F90:631

profiling_oct_m::profiling_in
subroutine, public profiling_in(label, exclude)
Increment in counter and save entry time.
Definition: profiling.F90:554

projector_oct_m
Definition: projector.F90:116

projector_oct_m::zprojector_commute_r_allatoms_alldir
subroutine, public zprojector_commute_r_allatoms_alldir(pj, ions, mesh, dim, bnd, ik, psi, cpsi)
This function calculates |cpsi> += [x, V_nl] |psi>
Definition: projector.F90:1758

scissor_oct_m
Definition: scissor.F90:115

space_oct_m
Definition: space.F90:116

states_elec_oct_m
Definition: states_elec.F90:115

states_elec_oct_m::states_elec_block_max
integer pure function, public states_elec_block_max(st, ib)
return index of last state in block ib
Definition: states_elec.F90:2601

states_elec_oct_m::states_elec_block_min
integer pure function, public states_elec_block_min(st, ib)
return index of first state in block ib
Definition: states_elec.F90:2591

states_elec_parallel_oct_m
This module provides routines for communicating states when using states parallelization.
Definition: states_elec_parallel.F90:121

states_elec_parallel_oct_m::states_elec_parallel_remote_access_stop
subroutine, public states_elec_parallel_remote_access_stop(this)
stop remote memory access for states on other processors
Definition: states_elec_parallel.F90:224

states_elec_parallel_oct_m::states_elec_parallel_remote_access_start
subroutine, public states_elec_parallel_remote_access_start(this)
start remote memory access for states on other processors
Definition: states_elec_parallel.F90:183

types_oct_m
Definition: types.F90:116

types_oct_m::type_float
type(type_t), public type_float
Definition: types.F90:135

unit_oct_m
This module defines the class unit_t which is used by the unit_system_oct_m module.
Definition: unit.F90:134

unit_system_oct_m
This module defines the unit system, used for input and output.
Definition: unit_system.F90:128

varinfo_oct_m
Definition: varinfo.F90:116

wfs_elec_oct_m
Definition: wfs_elec.F90:116

xc_oct_m
Definition: xc.F90:116

xc_oct_m::family_is_mgga_with_exc
logical pure function, public family_is_mgga_with_exc(xcs)
Is the xc function part of the mGGA family with an energy functional.
Definition: xc.F90:593

xc_oct_m::family_is_hybrid
logical pure function, public family_is_hybrid(xcs)
Returns true if the functional is a hybrid functional.
Definition: xc.F90:608

current_oct_m::current_t
Definition: current.F90:158

derivatives_oct_m::derivatives_t
class representing derivatives
Definition: derivatives.F90:220

grid_oct_m::grid_t
Description of the grid, containing information on derivatives, stencil, and symmetries.
Definition: grid.F90:171

hamiltonian_elec_oct_m::hamiltonian_elec_t
Definition: hamiltonian_elec.F90:227

namespace_oct_m::namespace_t
Definition: namespace.F90:117

space_oct_m::space_t
Definition: space.F90:132

states_elec_oct_m::states_elec_t
The states_elec_t class contains all electronic wave functions.
Definition: states_elec.F90:229

wfs_elec_oct_m::wfs_elec_t
batches of electronic states
Definition: wfs_elec.F90:141

true
int true(void)
Definition: symmetries_finite.c:3150