Skip to content

Commit

Permalink
Bug fix for looping over states and adding DF
Browse files Browse the repository at this point in the history
  • Loading branch information
Bhavnesh Jangid committed Aug 9, 2024
1 parent 63e5223 commit 1c4970a
Showing 1 changed file with 61 additions and 88 deletions.
149 changes: 61 additions & 88 deletions my_pyscf/mcpdft/laspdft.py
Original file line number Diff line number Diff line change
Expand Up @@ -13,10 +13,9 @@
try:
from pyscf.mcpdft.mcpdft import _PDFT, _mcscf_env
except ImportError:
msg = "For performing LASPDFT, you will require pyscf-forge.\n" + \
"pyscf-forge can be found at : https://github.com/pyscf/pyscf-forge"
raise ImportError(msg)

msg = "For performing LASPDFT, you will require pyscf-forge.\n" +\
"pyscf-forge can be found at : https://github.com/pyscf/pyscf-forge"
raise ImportError(msg)

def make_casdm1s(filename, i):
'''
Expand All @@ -28,7 +27,6 @@ def make_casdm1s(filename, i):
rdm1s = np.array(rdm1s)
return rdm1s


def make_casdm2s(filename, i):
'''
This function stores the rdm2s for the given state 'i' in a tempfile
Expand All @@ -39,26 +37,26 @@ def make_casdm2s(filename, i):
rdm2s = np.array(rdm2s)
return rdm2s


class _LASPDFT(_PDFT):
'MC-PDFT energy for a LASSCF wavefunction'

def get_h2eff(self, mo_coeff=None):
'Compute the active space two-particle Hamiltonian.'
ncore = self.ncore
ncas = self.ncas
nocc = ncore + ncas
if mo_coeff is None:
mo_coeff = self.mo_coeff[:, ncore:nocc]
elif mo_coeff.shape[1] != ncas:
mo_coeff = mo_coeff[:, ncore:nocc]
if mo_coeff is None: mo_coeff = self.mo_coeff[:,ncore:nocc]
elif mo_coeff.shape[1] != ncas: mo_coeff = mo_coeff[:,ncore:nocc]

if getattr(self._scf, '_eri', None) is not None:
if getattr (self._scf, '_eri', None) is not None:
eri = ao2mo.full(self._scf._eri, mo_coeff,
max_memory=self.max_memory)
max_memory=self.max_memory)
elif self.with_df:
eri = self.with_df.ao2mo(mo_coeff)

else:
eri = ao2mo.full(self.mol, mo_coeff, verbose=self.verbose,
max_memory=self.max_memory)
max_memory=self.max_memory)
return eri

def compute_pdft_energy_(self, mo_coeff=None, ci=None, ot=None, otxc=None,
Expand All @@ -79,15 +77,15 @@ def compute_pdft_energy_(self, mo_coeff=None, ci=None, ot=None, otxc=None,
nroots = getattr(self.fcisolver, 'nroots', 1)
if isinstance(nroots, list):
epdft = [self.energy_tot(mo_coeff=self.mo_coeff, ci=self.ci, state=ix,
logger_tag='MC-PDFT state {}'.format(ix))
for ix in nroots]
logger_tag='MC-PDFT state {}'.format(ix))
for ix in nroots]
else:
epdft = [self.energy_tot(mo_coeff=self.mo_coeff, ci=self.ci, state=ix,
logger_tag='MC-PDFT state {}'.format(ix))
for ix in range(nroots)]
logger_tag='MC-PDFT state {}'.format(ix))
for ix in range(nroots)]

self.e_ot = [e_ot for e_tot, e_ot in epdft]

if isinstance(self, StateAverageMCSCFSolver):
e_states = [e_tot for e_tot, e_ot in epdft]
try:
Expand All @@ -108,117 +106,89 @@ def compute_pdft_energy_(self, mo_coeff=None, ci=None, ot=None, otxc=None,
e_states = [self.e_tot]
return self.e_tot, self.e_ot, e_states

def multi_state(self, method='Lin'):
if method.upper() == "LIN":
from mrh.my_pyscf.mcpdft._lpdft import linear_multi_state
return linear_multi_state(self)
else:
raise NotImplementedError(f"StateAverageMix not available for {method}")


def get_mcpdft_child_class(mc, ot, DoLASSI=False, states=None, **kwargs):
def get_mcpdft_child_class(mc, ot, DoLASSI=False,states=None,**kwargs):
mc_doc = (mc.__class__.__doc__ or 'No docstring for MC-SCF parent method')

class PDFT(_LASPDFT, mc.__class__):
__doc__ = mc_doc + '\n\n' + _LASPDFT.__doc__
__doc__= mc_doc + '\n\n' + _LASPDFT.__doc__
_mc_class = mc.__class__
setattr(_mc_class, 'DoLASSI', None)
setattr(_mc_class, 'states', None)
setattr(_mc_class, 'statlis', None)
setattr(_mc_class, 'rdmstmpfile', None)

def get_h2eff(self, mo_coeff=None):
if self._in_mcscf_env:
if self._in_mcscf_env:
return mc.__class__.get_h2eff(self, mo_coeff=mo_coeff)
else:
else:
return _LASPDFT.get_h2eff(self, mo_coeff=mo_coeff)

def compute_pdft_energy_(self, mo_coeff=None, ci=None, ot=None, otxc=None,
grids_level=None, grids_attr=None, states=states, **kwargs):
grids_level=None, grids_attr=None, states=states, **kwargs):
return _LASPDFT.compute_pdft_energy_(self, mo_coeff=mo_coeff, ci=ci, ot=ot, otxc=otxc,
grids_level=grids_level, grids_attr=grids_attr, **kwargs)

def multi_state(self, **kwargs):
'''
In future will have to change this to consider the modal space selection, weights...
'''
assert self.DoLASSI, "multi_state is only defined for post LAS methods"
return _LASPDFT.multi_state(self, **kwargs)

multi_state_mix = multi_state
grids_level=grids_level, grids_attr=grids_attr, **kwargs)

if DoLASSI:
if DoLASSI:
_mc_class.DoLASSI = True
_mc_class.rdmstmpfile = tempfile.NamedTemporaryFile(dir=lib.param.TMPDIR)

else:
_mc_class.DoLASSI = False

if states is not None: _mc_class.states = states


else: _mc_class.DoLASSI = False

if states is not None: _mc_class.states=states

if _mc_class.DoLASSI:

'''
The cost of the RDM build is similar to LASSI diagonalization step. Therefore,
calling it 2n time for n-states becomes prohibitively expensive. One alternative
can be just call it once and store all the generated casdm1 and casdm2 and later on
just call a reader function which will read the rdms from this temp file.
'''

def _store_rdms(self):
# MRH: I made it loop over blocks of states to handle the O(N^5) memory cost
# If there's enough memory it'll still do them all at once
log = lib.logger.new_logger (self, self.verbose)
safety_factor = 1.3
mem_per_state = safety_factor*8*(2*(self.ncas**2) + 4*(self.ncas**4)) / 1e6
mem_per_state = 8*(2*(self.ncas**2) + 4*(self.ncas**4)) / 1e6
current_mem = lib.current_memory ()[0]

if current_mem > self.max_memory:
log.warn("Current memory usage (%d MB) exceeds maximum memory (%d MB)",
current_mem, self.max_memory)
log.warn ("Current memory usage (%d MB) exceeds maximum memory (%d MB)",
current_mem, self.max_memory)
nblk = 1
else:
nblk = max (1, int ((self.max_memory - current_mem) / mem_per_state)-1)

log.debug ('_store_rdms: looping over %d states at a time of %d total', nblk,
len (self.e_states))

rdmstmpfile = self.rdmstmpfile
with h5py.File(rdmstmpfile, 'w') as f:
for i in range(0, len(self.e_states), nblk):
j = min(i + nblk, len(self.e_states))
for i in range (0, len (self.states), nblk):
j = min (i+nblk, len (self.states))
rdm1s, rdm2s = lassi.root_make_rdm12s(self, self.ci, self.si,
state=list(range(i, j)))
for k in range(i, j):
state=list(range(i,j)))
for k in range (i, j):
rdm1s_dname = f'rdm1s_{k}'
f.create_dataset(rdm1s_dname, data=rdm1s[k])
rdm2s_dname = f'rdm2s_{k}'
f.create_dataset(rdm2s_dname, data=rdm2s[k])
rdm1s = rdm2s = None

# # This code doesn't seem efficent, have to calculate the casdm1 and casdm2 in different functions.
rdm1s = rdm2s = None

# # This code doesn't seem efficent, have to calculate the casdm1 and casdm2 in different functions.
# def make_one_casdm1s(self, ci=None, state=0, **kwargs):
# with lib.temporary_env (self, verbose=2):
# casdm1s = lassi.root_make_rdm12s (self, ci=ci, si=self.si, state=state)[0]
# return casdm1s
# with lib.temporary_env (self, verbose=2):
# casdm1s = lassi.root_make_rdm12s (self, ci=ci, si=self.si, state=state)[0]
# return casdm1s
# def make_one_casdm2(self, ci=None, state=0, **kwargs):
# with lib.temporary_env (self, verbose=2):
# casdm2s = lassi.root_make_rdm12s (self, ci=ci, si=self.si, state=state)[1]
# return casdm2s.sum ((0,3))

# with lib.temporary_env (self, verbose=2):
# casdm2s = lassi.root_make_rdm12s (self, ci=ci, si=self.si, state=state)[1]
# return casdm2s.sum ((0,3))
def make_one_casdm1s(self, ci=None, state=0, **kwargs):
rdmstmpfile = self.rdmstmpfile
return make_casdm1s(rdmstmpfile, state)

def make_one_casdm2(self, ci=None, state=0, **kwargs):
rdmstmpfile = self.rdmstmpfile
return make_casdm2s(rdmstmpfile, state).sum((0, 3))

return make_casdm2s(rdmstmpfile, state).sum ((0,3))
else:
make_one_casdm1s = mc.__class__.state_make_casdm1s
make_one_casdm2 = mc.__class__.state_make_casdm2
make_one_casdm1s=mc.__class__.state_make_casdm1s
make_one_casdm2=mc.__class__.state_make_casdm2

# TODO: in pyscf-forge/pyscf/mcpdft/mcpdft.py::optimize_mcscf_, generalize the number
# of return arguments. Then the redefinition below will be unnecessary.
Expand All @@ -227,18 +197,21 @@ def optimize_mcscf_(self, mo_coeff=None, ci0=None, **kwargs):
Has the same calling signature as the parent kernel method. '''
with _mcscf_env(self):
if self.DoLASSI:
self.e_states = self.e_roots
self.statlis = [x for x in range(len(self.e_states))]
self.fcisolver.nroots = len(self.e_states) if self.states is None else self.states
if self.states is None:
self.fcisolver.nroots = len(self.e_roots)
self.states = list(range(len(self.e_roots)))
else:
self.fcisolver.nroots = self.states
self._store_rdms()
else:
self.e_mcscf, self.e_cas, self.ci, self.mo_coeff, self.mo_energy = \
self._mc_class.kernel(self, mo_coeff, ci0=ci0, **kwargs)[:-2]
self.fcisolver.nroots = self.nroots

pdft = PDFT(mc._scf, mc.ncas_sub, mc.nelecas_sub, my_ot=ot, **kwargs)

_keys = pdft._keys.copy()
pdft.__dict__.update(mc.__dict__)
pdft.__dict__.update (mc.__dict__)
pdft._keys = pdft._keys.union(_keys)
return pdft


0 comments on commit 1c4970a

Please sign in to comment.