Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Implemented atomic representation for a single element type and valence electron only representation #39

Merged
merged 18 commits into from
May 9, 2024
Merged
Show file tree
Hide file tree
Changes from 7 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
22 changes: 16 additions & 6 deletions qstack/spahm/rho/atom.py
Copy link
Contributor

@briling briling May 7, 2024

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

maybe this

    for j,i in enumerate(only_i):
        q = mol.elements[i]
        v = rep[j]

can be replaced with this

    for q, v in zip(mol.elements[only_i], rep):

which is easier to read and more similar to the previous version

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

maybe even a one liner

mrep = [np.array((q, v), dtype=object) for q, v in zip(mol.elements[only_i], rep)]

but not sure about readability

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I liked the one line. but it doesn't work cause mol.elements is a list and not a numpy.array so you can not subscript it with a list of integers.
the intermediate option does not work neither then!

I can create a copy of mol.elements in a numpy.array and go for the oneliner, but it feels a bit like an overhead.
what do you think?

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

i'd put zip(np.array(mol.elements)[only_i], rep)] lol

Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I just don't like j,i

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

ahah sure! Done 👌

Original file line number Diff line number Diff line change
Expand Up @@ -19,7 +19,7 @@ def check_file(mol_file):
def get_repr(mol, elements, charge, spin,
open_mod=defaults.omod, dm=None,
guess=defaults.guess, model=defaults.model, xc=defaults.xc,
auxbasis=defaults.auxbasis):
auxbasis=defaults.auxbasis, only_z=[], valence_only=False):

# User-defined options
elements = sorted(list(set(elements)))
Expand All @@ -31,11 +31,16 @@ def get_repr(mol, elements, charge, spin,
# Compute density matrices
if dm is None:
dm = spahm.compute_spahm.get_guess_dm(mol, guess, openshell=spin, xc=xc)
# if only the representations for a given atom type are to be computed restricts the considered atomic indices
if len(only_z) != 0:
only_i = [i for i,z in enumerate(mol.elements) if z in only_z]
else:
only_i = range(mol.natm) #otherwise consider the full list of atomic indices

rep = []
for omod in open_mod:
DM = utils.dm_open_mod(dm, omod) if spin is not None else dm
c_df = df_wrapper(mol, DM, auxbasis)
c_df = df_wrapper(mol, DM, auxbasis, only_i=only_i, valence_only=valence_only)
vectors = sym_wrapper(c_df, mol, idx, ao, ao_len, M, elements)
if spin is None:
rep = vectors
Expand All @@ -46,8 +51,10 @@ def get_repr(mol, elements, charge, spin,
rep = np.hstack(rep)

mrep = []
for q, v in zip(mol.elements, rep):
mrep.append(np.array((q, v)))
for j,i in enumerate(only_i):
q = mol.elements[i]
v = rep[j]
mrep.append(np.array((q, v), dtype=object))
return np.array(mrep)


Expand All @@ -61,21 +68,24 @@ def main():
parser.add_argument('--model', dest='model', default=defaults.model, type=str, help=f"the model to use when creating the representation (default: {defaults.model})")
parser.add_argument('--dm', dest='dm', default=None, type=str, help="a density matrix to load instead of computing the guess")
parser.add_argument('--species', dest='elements', default=defaults.elements, nargs='+', type=str, help="the elements contained in the database")
parser.add_argument('--only', dest='only_z', default=[], nargs='+', type=str, help="The restricted list of elements for which you want to generate the representation")
parser.add_argument('--charge', dest='charge', default=0, type=int, help='total charge of the system (default: 0)')
parser.add_argument('--spin', dest='spin', default=None, type=int, help='number of unpaired electrons (default: None) (use 0 to treat a closed-shell system in a UHF manner)')
parser.add_argument('--xc', dest='xc', default=defaults.xc, type=str, help=f'DFT functional for the SAD guess (default: {defaults.xc})')
parser.add_argument('--nameout', dest='NameOut', default=None, type=str, help='name of the output representations file.')
parser.add_argument('--omod', dest='omod', default=defaults.omod, nargs='+', type=str, help=f'model(s) for open-shell systems (alpha, beta, sum, diff, default: {defaults.omod})')
parser.add_argument('--valence', dest='valence_only', action='store_true', help=f'to generate valence density only representations')
args = parser.parse_args()
print(vars(args))

mol = compound.xyz_to_mol(check_file(args.mol), args.basis, charge=args.charge, spin=args.spin, unit=args.units)
dm = None if args.dm is None else np.load(args.dm)

representations = get_repr(mol, elements, args.charge, args.spin,
representations = get_repr(mol, args.elements, args.charge, args.spin,
open_mod=args.omod,
dm=dm, guess=args.guess, model=args.model,
xc=args.xc, auxbasis=args.auxbasis)
xc=args.xc, auxbasis=args.auxbasis, only_z=args.only_z,
valence_only=args.valence_only)

# output dir
cwd = os.getcwd()
Expand Down
10 changes: 8 additions & 2 deletions qstack/spahm/rho/atomic_density.py
Original file line number Diff line number Diff line change
Expand Up @@ -3,11 +3,15 @@
from . import lowdin


def fit(mol, dm, aux_basis, short=False, w_slicing=True):
def fit(mol, dm, aux_basis, short=False, w_slicing=True, only_i=[], valence_only=False):

L = lowdin.Lowdin_split(mol, dm)

dm_slices = mol.aoslice_nr_by_atom()[:,2:]
if len(only_i) != 0:
dm_slices = mol.aoslice_nr_by_atom()[only_i,2:]
else:
dm_slices = mol.aoslice_nr_by_atom()[:,2:]

auxmol = compound.make_auxmol(mol, aux_basis)
eri2c, eri3c = fields.decomposition.get_integrals(mol, auxmol)[1:]

Expand All @@ -24,6 +28,8 @@ def fit(mol, dm, aux_basis, short=False, w_slicing=True):
a_dm1 = np.zeros_like(L.dmL)
a_dm1[start:stop,:] += L.dmL[start:stop,:]*0.5
a_dm1[:,start:stop] += L.dmL[:,start:stop]*0.5
if valence_only:
a_dm1[start:stop,start:stop] = 0
a_dm0 = L.S12i @ a_dm1 @ L.S12i

c_a = fields.decomposition.get_coeff(a_dm0, J, eri3c)
Expand Down
16 changes: 8 additions & 8 deletions qstack/spahm/rho/dmb_rep_atom.py
Original file line number Diff line number Diff line change
Expand Up @@ -29,17 +29,17 @@ def df_sad_diff(mol, dm, auxbasis):
dm = dm - dm_sad
return fields.decomposition.decompose(mol, dm, auxbasis)[1]

def df_lowdin_long(mol, dm, auxbasis):
return atomic_density.fit(mol, dm, auxbasis)
def df_lowdin_long(mol, dm, auxbasis, only_i=[], valence_only=False):
return atomic_density.fit(mol, dm, auxbasis, only_i=only_i, valence_only=valence_only)

def df_lowdin_short(mol, dm, auxbasis):
return atomic_density.fit(mol, dm, auxbasis, short=True)
def df_lowdin_short(mol, dm, auxbasis, only_i=[], valence_only=False):
return atomic_density.fit(mol, dm, auxbasis, short=True, only_i=only_i, valence_only=valence_only)

def df_lowdin_long_x(mol, dm, auxbasis):
return atomic_density.fit(mol, dm, auxbasis, w_slicing=False)
def df_lowdin_long_x(mol, dm, auxbasis, only_i=[], valence_only=False):
return atomic_density.fit(mol, dm, auxbasis, w_slicing=False, only_i=only_i, valence_only=valence_only)

def df_lowdin_short_x(mol, dm, auxbasis):
return atomic_density.fit(mol, dm, auxbasis, short=True, w_slicing=False)
def df_lowdin_short_x(mol, dm, auxbasis, only_i=[], valence_only=False):
return atomic_density.fit(mol, dm, auxbasis, short=True, w_slicing=False, only_i=only_i, valence_only=valence_only)

def df_occup(mol, dm, auxbasis):
L = lowdin.Lowdin_split(mol, dm)
Expand Down
Binary file added tests/data/SPAHM_a_H2O/X_H2O_valence-only.npy
Binary file not shown.
24 changes: 24 additions & 0 deletions tests/test_spahm_a.py
Original file line number Diff line number Diff line change
Expand Up @@ -43,6 +43,30 @@ def test_water_SAD_guess_close_shell():
assert(a[0] == a_true[0]) # atom type
assert(np.linalg.norm(a[1]-a_true[1]) < 1e-08) # atom representations

def test_water_single_element():
path = os.path.dirname(os.path.realpath(__file__))
mol = compound.xyz_to_mol(path+'/data/H2O.xyz', 'minao', charge=0, spin=None)

X = atom.get_repr(mol, ["H", "O"], 0, None, dm=None,
guess='LB', model='lowdin-long-x', auxbasis='ccpvdzjkfit', only_z=['O']) #requesting reps for O-atom only

X_true = np.load(path+'/data/SPAHM_a_H2O/X_H2O.npy', allow_pickle=True)
a = X[0]
for a_true in X_true:
if a[0] == a_true[0]: # atom type
assert(np.linalg.norm(a[1]-a_true[1]) < 1e-08) # atom representations

def test_water_valence_only():
path = os.path.dirname(os.path.realpath(__file__))
mol = compound.xyz_to_mol(path+'/data/H2O.xyz', 'minao', charge=0, spin=None)

X = atom.get_repr(mol, ["H", "O"], 0, None, dm=None,
guess='LB', model='lowdin-long-x', auxbasis='ccpvdzjkfit', valence_only=True)
X_true = np.load(path+'/data/SPAHM_a_H2O/X_H2O_valence-only.npy', allow_pickle=True)
assert(X.shape == X_true.shape)
for a, a_true in zip(X, X_true):
assert(a[0] == a_true[0]) # atom type
assert(np.linalg.norm(a[1]-a_true[1]) < 1e-08) # atom representations


if __name__ == '__main__':
Expand Down
Loading