Source code for pyscf.mcpdft.pdft_veff

#!/usr/bin/env python
# Copyright 2014-2022 The PySCF Developers. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#

from pyscf.lib import logger, current_memory, tag_array
from pyscf.dft.gen_grid import BLKSIZE
from pyscf.mcpdft.otpd import get_ontop_pair_density
from pyscf.mcpdft.pdft_eff import _ERIS
import numpy as np
import gc


# MRH 05/18/2020: An annoying convention in pyscf.dft.numint that I have to
# comply with is that the AO grid-value arrays and all their derivatives are in
# NEITHER column-major NOR row-major order; they all have ndim = 3 and strides
# of (8*ngrids*nao, 8, 8*ngrids). Here, for my ndim > 3 objects, I choose to
# generalize this so that a cyclic transpose to the left,
# ao.transpose (1,2,3,...,0), places the array in column-major (FORTRAN-style)
# order. I have to comply with this awkward convention in order to take full
# advantage of the code in pyscf.dft.numint and libdft.so. The ngrids
# dimension, which is by far the largest, almost always benefits from having
# the smallest stride.

# MRH 05/19/2020: Actually, I really should just turn the deriv component part
# of all of these arrays into lists and keep everything in col-major order
# otherwise, because ndarrays have to have regular strides, but lists can just
# be references and less copying is involved. The copying is more expensive and
# less transparently parallel-scalable than the actual math! (The
# parallel-scaling part of that is stupid but it is what it is.)


[docs]
def kernel(ot, dm1s, cascm2, mo_coeff, ncore, ncas,
           max_memory=2000, hermi=1, paaa_only=False, aaaa_only=False,
           jk_pc=False):
    '''Get the 1- and 2-body effective potential from MC-PDFT.

    Args:
        ot : an instance of otfnal class
        dm1s : ndarray of shape (2, nao, nao)
            containing spin-separated one-body density matrices
        cascm2 : ndarray of shape (ncas, ncas, ncas, ncas)
            containing spin-summed two-body cumulant density matrix in
            an active space
        mo_coeff : ndarray of shape (nao, nmo)
            containing molecular orbital coefficients
        ncore : integer
            number of inactive orbitals
        ncas : integer
            number of active orbitals

    Kwargs:
        max_memory : int or float
            maximum cache size in MB
            default is 2000
        hermi : int
            1 if 1rdms are assumed hermitian, 0 otherwise
        paaa_only : logical
            If true, only compute the paaa range of papa and ppaa
            (all other elements set to zero)
        aaaa_only : logical
            If true, only compute the aaaa range of papa and ppaa
            (all other elements set to zero; overrides paaa_only)
        jk_pc : logical
            If true, compute the ppii=pipi elements of veff2
            (otherwise, these are set to zero)

    Returns:
        veff1 : ndarray of shape (nao, nao)
            1-body effective potential
        veff2 : object of class pdft_eff._ERIS
            2-body effective potential and related quantities
    '''
    nocc = ncore + ncas
    ni, xctype, dens_deriv = ot._numint, ot.xctype, ot.dens_deriv
    nao = mo_coeff.shape[0]
    mo_core = mo_coeff[:, :ncore]
    mo_cas = mo_coeff[:, ncore:nocc]
    shls_slice = (0, ot.mol.nbas)
    ao_loc = ot.mol.ao_loc_nr()

    omega, alpha, hyb = ot._numint.rsh_and_hybrid_coeff(ot.otxc)
    hyb_x, hyb_c = hyb
    if abs(omega) > 1e-11:
        raise NotImplementedError("range-separated on-top functionals")

    if abs(hyb_x - hyb_c) > 1e-11:
        raise NotImplementedError(
            "effective potential for hybrid functionals with different exchange, correlations components")


    E_ot = 0.0
    veff1 = np.zeros((nao, nao), dtype=dm1s.dtype)
    veff2 = _ERIS(ot.mol, mo_coeff, ncore, ncas, paaa_only=paaa_only,
                  aaaa_only=aaaa_only, jk_pc=jk_pc, verbose=ot.verbose,
                  stdout=ot.stdout)

    t0 = (logger.process_clock(), logger.perf_counter())

    # Density matrices
    dm_core = mo_core @ mo_core.T
    dm_cas = dm1s - dm_core[None, :, :]
    dm_core *= 2

    # Propagate speedup tags
    if hasattr(dm1s, 'mo_coeff') and hasattr(dm1s, 'mo_occ'):
        dm_core = tag_array(dm_core, mo_coeff=dm1s.mo_coeff[0, :, :ncore],
                            mo_occ=dm1s.mo_occ[:, :ncore].sum(0))
        dm_cas = tag_array(dm_cas, mo_coeff=dm1s.mo_coeff[:, :, ncore:nocc],
                           mo_occ=dm1s.mo_occ[:, ncore:nocc])

    # rho generators
    make_rho_c = ni._gen_rho_evaluator(ot.mol, dm_core, hermi=hermi, with_lapl=False)[0]
    make_rho_a = ni._gen_rho_evaluator(ot.mol, dm_cas, hermi=hermi, with_lapl=False)[0]
    make_rho = ni._gen_rho_evaluator(ot.mol, dm1s, hermi=hermi, with_lapl=False)[0]

    # memory block size
    gc.collect()
    remaining_floats = (max_memory - current_memory()[0]) * 1e6 / 8
    nderiv_rho = (1, 4, 5)[dens_deriv]
    nderiv_Pi = (1, 4)[ot.Pi_deriv]
    nderiv_ao = (1,4,10)[dens_deriv]
    ncols = 4 + nderiv_rho * nao  # ao, weight, coords
    ncols += nderiv_rho * 4 + nderiv_Pi  # rho, rho_a, rho_c, Pi
    ncols += 1 + nderiv_rho + nderiv_Pi  # eot, vot

    # Asynchronous part
    nveff1 = nderiv_ao * (nao + 1)  # footprint of get_veff_1body
    nveff2 = veff2._accumulate_ftpt() * nderiv_Pi
    ncols += np.amax([nveff1, nveff2])  # asynchronous fns
    pdft_blksize = int(remaining_floats / (ncols * BLKSIZE)) * BLKSIZE
    if ot.grids.coords is None:
        ot.grids.build(with_non0tab=True)
    ngrids = ot.grids.coords.shape[0]
    ngrids_blk = int(ngrids / BLKSIZE) * BLKSIZE
    pdft_blksize = max(BLKSIZE, min(pdft_blksize, ngrids_blk, BLKSIZE * 1200))
    logger.debug(ot, ('{} MB used of {} available; block size of {} chosen'
                      'for grid with {} points').format(current_memory()[0], max_memory,
                                                        pdft_blksize, ngrids))

    # The actual loop
    for ao, mask, weight, coords in ni.block_loop(ot.mol, ot.grids, nao,
                                                  dens_deriv, max_memory, blksize=pdft_blksize):
        rho = np.asarray([make_rho(i, ao, mask, xctype) for i in range(2)])
        rho_a = sum([make_rho_a(i, ao, mask, xctype) for i in range(2)])
        rho_c = make_rho_c(0, ao, mask, xctype)
        t0 = logger.timer(ot, 'untransformed densities (core and total)', *t0)
        Pi = get_ontop_pair_density(ot, rho, ao, cascm2, mo_cas,
                                    deriv=ot.Pi_deriv, non0tab=mask)
        t0 = logger.timer(ot, 'on-top pair density calculation', *t0)
        eot, vot = ot.eval_ot(rho, Pi, weights=weight)[:2]
        E_ot += eot.dot(weight)
        vrho, vPi = vot
        t0 = logger.timer(ot, 'effective potential kernel calculation', *t0)
        if ao.ndim == 2: ao = ao[None, :, :]
        # TODO: consistent format req's ao LDA case
        veff1 += ot.get_eff_1body(ao, weight, kern=vrho, non0tab=mask,
                                   shls_slice=shls_slice, ao_loc=ao_loc, hermi=1)
        t0 = logger.timer(ot, '1-body effective potential calculation', *t0)
        veff2._accumulate(ot, ao, weight, rho_c, rho_a, vPi, mask,
                          shls_slice, ao_loc)
        t0 = logger.timer(ot, '2-body effective potential calculation', *t0)
    veff2._finalize()
    t0 = logger.timer(ot, 'Finalizing 2-body effective potential calculation',
                      *t0)
    return E_ot, veff1, veff2




[docs]
def lazy_kernel(ot, dm1s, cascm2, mo_cas, max_memory=2000, hermi=1,
                veff2_mo=None):
    '''Get the 1- and 2-body effective potential from MC-PDFT.
    Eventually I'll be able to specify mo slices for the 2-body part

    Args:
        ot : an instance of otfnal class
        dm1s : ndarray of shape (2, nao, nao)
            containing spin-separated one-body density matrices
        cascm2 : ndarray of shape (ncas, ncas, ncas, ncas)
            containing spin-summed two-body cumulant density matrix
            in an active space
        mo_cas : ndarray of shape (nao, ncas)
            containing molecular orbital coefficients for
            active-space orbitals

    Kwargs:
        max_memory : int or float
            maximum cache size in MB
            default is 2000
        hermi : int
            1 if 1rdms are assumed hermitian, 0 otherwise

    Returns : float
        The MC-PDFT on-top exchange-correlation energy
    '''
    if veff2_mo is not None:
        raise NotImplementedError('Molecular orbital slices for 2-body part')
    ni, xctype = ot._numint, ot.xctype
    dens_deriv = ot.dens_deriv
    Pi_deriv = ot.Pi_deriv
    nao = mo_cas.shape[0]

    veff1 = np.zeros_like(dm1s[0])
    veff2 = np.zeros((nao, nao, nao, nao), dtype=veff1.dtype)

    t0 = (logger.process_clock(), logger.perf_counter())
    make_rho = tuple(ni._gen_rho_evaluator(ot.mol, dm1s[i, :, :], hermi=hermi, with_lapl=False)
                     for i in range(2))
    for ao, mask, weight, coords in ni.block_loop(ot.mol, ot.grids, nao,
                                                  dens_deriv, max_memory):
        rho = np.asarray([m[0](0, ao, mask, xctype) for m in make_rho])
        t0 = logger.timer(ot, 'untransformed density', *t0)
        Pi = get_ontop_pair_density(ot, rho, ao, cascm2, mo_cas,
                                    deriv=Pi_deriv, non0tab=mask)
        t0 = logger.timer(ot, 'on-top pair density calculation', *t0)
        _, vot = ot.eval_ot(rho, Pi, weights=weight)[:2]
        vrho, vPi = vot
        t0 = logger.timer(ot, "effective potential kernel calculation", *t0)
        if ao.ndim == 2:
            ao = ao[None, :, :]
        # TODO: consistent format req's ao LDA case
        veff1 += ot.get_eff_1body(ao, weight, kern=vrho, non0tab=mask)
        t0 = logger.timer(ot, '1-body effective potential calculation', *t0)
        veff2 += ot.get_eff_2body(ao, weight, kern=vPi, aosym=1)
        t0 = logger.timer(ot, '2-body effective potential calculation', *t0)
    return veff1, veff2




[docs]
def get_veff_1body(otfnal, rho, Pi, ao, weight, kern=None, non0tab=None,
                   shls_slice=None, ao_loc=None, hermi=0, **kwargs):
    r''' get the derivatives dEot / dDpq
    Can also be abused to get semidiagonal dEot / dPppqq if you pass the
    right kern and squared aos/mos

    Args:
        rho : ndarray of shape (2,*,ngrids)
            containing spin-density [and derivatives]
        Pi : ndarray with shape (*,ngrids)
            containing on-top pair density [and derivatives]
        ao : ndarray or 2 ndarrays of shape (*,ngrids,nao)
            contains values and derivatives of nao.
            2 different ndarrays can have different nao but not
            different ngrids
        weight : ndarray of shape (ngrids)
            containing numerical integration weights

    Kwargs:
        kern : ndarray of shape (*,ngrids)
            the derivative of the on-top potential with respect to
            density (vrho)/ If not provided, it is calculated.
        non0tab : ndarray of shape (nblk, nbas)
            Identifies blocks of grid points which are nonzero on
            each AO shell so as to exploit sparsity.
            If you want the "ao" array to be in the MO basis, just
            leave this as None. If hermi == 0, it only applies
            to the bra index ao array, even if the ket index ao
            array is the same (so probably always pass hermi = 1
            in that case)
        shls_slice : sequence of integers of len 2
            Identifies starting and stopping indices of AO shells
        ao_loc : ndarray of length nbas
            Offset to first AO of each shell
        hermi : integer or logical
            Toggle whether veff is supposed to be a Hermitian matrix
            You can still pass two different ao arrays for the bra and
            the ket indices, for instance if one of them is supposed to
            be a higher derivative. They just have to have the same nao
            in that case.

    Returns : ndarray of shape (nao[0],nao[1])
        The 1-body effective potential corresponding to this on-top pair
        density exchange-correlation functional, in the atomic-orbital
        basis. In PDFT this functional is always spin-symmetric.
    '''

    if kern is None:
        if rho.ndim == 2:
            rho = np.expand_dims(rho, 1)
            Pi = np.expand_dims(Pi, 0)

        kern = otfnal.eval_ot(rho, Pi, dderiv=1, **kwargs)[1][1]
        rho = np.squeeze(rho)
        Pi = np.squeeze(Pi)

    return otfnal.get_eff_1body(ao, weight, kern=kern, non0tab=non0tab,
                                shls_slice=shls_slice, ao_loc=ao_loc,
                                hermi=hermi)




[docs]
def get_veff_2body(otfnal, rho, Pi, ao, weight, aosym='s4', kern=None,
                   vao=None, **kwargs):
    r''' get the derivatives dEot / dPijkl

    Args:
        rho : ndarray of shape (2,*,ngrids)
            containing spin-density [and derivatives]
        Pi : ndarray with shape (*,ngrids)
            containing on-top pair density [and derivatives]
        ao : ndarray of shape (*,ngrids,nao)
            OR list of ndarrays of shape (*,ngrids,*)
            values and derivatives of atomic or molecular orbitals in
            which space to calculate the 2-body veff
            If a list of length 4, the corresponding set of eri-like
            elements are returned
        weight : ndarray of shape (ngrids)
            containing numerical integration weights

    Kwargs:
        aosym : int or str
            Index permutation symmetry of the desired integrals. Valid
            options are 1 (or '1' or 's1'), 4 (or '4' or 's4'), '2ij'
            (or 's2ij'), and '2kl' (or 's2kl'). These have the same
            meaning as in PySCF's ao2mo module. Currently all symmetry
            exploitation is extremely slow and unparallelizable for some
            reason so trying to use this is not recommended until I come
            up with a C routine.
        kern : ndarray of shape (*,ngrids)
            the derivative of the on-top potential with respect to pair
            density (vot). If not provided, it is calculated.
        vao : ndarray of shape (*,ngrids,nao,nao) or
            (*,ngrids,nao*(nao+1)//2). An intermediate in which the
            kernel and the k,l orbital indices have been contracted.
            Overrides kl_symm

    Returns : eri-like ndarray
        The two-body effective potential corresponding to this on-top
        pair density exchange-correlation functional or elements
        thereof, in the provided basis.
    '''

    if kern is None:
        if rho.ndim == 2:
            rho = np.expand_dims(rho, 1)
            Pi = np.expand_dims(Pi, 0)

        kern = otfnal.eval_ot(rho, Pi, dderiv=1, **kwargs)[1][2]

    return otfnal.get_eff_2body(ao, weight, kern, aosym=aosym, eff_ao=vao)




[docs]
def get_veff_2body_kl(otfnal, rho, Pi, ao_k, ao_l, weight, symm=False,
                      kern=None, **kwargs):
    r''' get the two-index intermediate Mkl of dEot/dPijkl

    Args:
        rho : ndarray of shape (2,*,ngrids)
            containing spin-density [and derivatives]
        Pi : ndarray with shape (*,ngrids)
            containing on-top pair density [and derivatives]
        ao_k : ndarray of shape (*,ngrids,nao)
            OR list of ndarrays of shape (*,ngrids,*)
            values and derivatives of atomic or molecular orbitals
            corresponding to index k
        ao_l : ndarray of shape (*,ngrids,nao)
            OR list of ndarrays of shape (*,ngrids,*)
            values and derivatives of atomic or molecular orbitals
            corresponding to index l
        weight : ndarray of shape (ngrids)
            containing numerical integration weights

    Kwargs:
        symm : logical
            Index permutation symmetry of the desired integral wrt k,l
        kern : ndarray of shape (*,ngrids)
            the derivative of the on-top potential with respect to pair
            density (vot). If not provided, it is calculated.

    Returns : ndarray of shape (*,ngrids,nao,nao)
        or (*,ngrids,nao*(nao+1)//2). An intermediate for calculating
        the two-body effective potential corresponding to this on-top
        pair density exchange-correlation functional in the provided
        basis.
    '''

    if kern is None:
        if rho.ndim == 2:
            rho = np.expand_dims(rho, 1)
            Pi = np.expand_dims(Pi, 0)

        kern = otfnal.eval_ot(rho, Pi, dderiv=1, **kwargs)[1][2]
    return otfnal.get_eff_2body_kl(ao_k, ao_l, weight, kern=kern, symm=symm)