|
import copy, time |
|
import numpy as np |
|
from collections import defaultdict |
|
from rdkit import Chem, RDLogger |
|
from rdkit.Chem import AllChem, rdMolTransforms |
|
from rdkit import Geometry |
|
import networkx as nx |
|
from scipy.optimize import differential_evolution |
|
|
|
RDLogger.DisableLog('rdApp.*') |
|
|
|
""" |
|
Conformer matching routines from Torsional Diffusion |
|
""" |
|
|
|
def GetDihedral(conf, atom_idx): |
|
return rdMolTransforms.GetDihedralRad(conf, atom_idx[0], atom_idx[1], atom_idx[2], atom_idx[3]) |
|
|
|
|
|
def SetDihedral(conf, atom_idx, new_vale): |
|
rdMolTransforms.SetDihedralRad(conf, atom_idx[0], atom_idx[1], atom_idx[2], atom_idx[3], new_vale) |
|
|
|
|
|
def apply_changes(mol, values, rotable_bonds, conf_id): |
|
opt_mol = copy.copy(mol) |
|
[SetDihedral(opt_mol.GetConformer(conf_id), rotable_bonds[r], values[r]) for r in range(len(rotable_bonds))] |
|
return opt_mol |
|
|
|
|
|
def optimize_rotatable_bonds(mol, true_mol, rotable_bonds, probe_id=-1, ref_id=-1, seed=0, popsize=15, maxiter=500, |
|
mutation=(0.5, 1), recombination=0.8): |
|
opt = OptimizeConformer(mol, true_mol, rotable_bonds, seed=seed, probe_id=probe_id, ref_id=ref_id) |
|
max_bound = [np.pi] * len(opt.rotable_bonds) |
|
min_bound = [-np.pi] * len(opt.rotable_bonds) |
|
bounds = (min_bound, max_bound) |
|
bounds = list(zip(bounds[0], bounds[1])) |
|
|
|
|
|
result = differential_evolution(opt.score_conformation, bounds, |
|
maxiter=maxiter, popsize=popsize, |
|
mutation=mutation, recombination=recombination, disp=False, seed=seed) |
|
opt_mol = apply_changes(opt.mol, result['x'], opt.rotable_bonds, conf_id=probe_id) |
|
|
|
return opt_mol |
|
|
|
|
|
class OptimizeConformer: |
|
def __init__(self, mol, true_mol, rotable_bonds, probe_id=-1, ref_id=-1, seed=None): |
|
super(OptimizeConformer, self).__init__() |
|
if seed: |
|
np.random.seed(seed) |
|
self.rotable_bonds = rotable_bonds |
|
self.mol = mol |
|
self.true_mol = true_mol |
|
self.probe_id = probe_id |
|
self.ref_id = ref_id |
|
|
|
def score_conformation(self, values): |
|
for i, r in enumerate(self.rotable_bonds): |
|
SetDihedral(self.mol.GetConformer(self.probe_id), r, values[i]) |
|
return RMSD(self.mol, self.true_mol, self.probe_id, self.ref_id) |
|
|
|
|
|
def get_torsion_angles(mol): |
|
torsions_list = [] |
|
G = nx.Graph() |
|
for i, atom in enumerate(mol.GetAtoms()): |
|
G.add_node(i) |
|
nodes = set(G.nodes()) |
|
for bond in mol.GetBonds(): |
|
start, end = bond.GetBeginAtomIdx(), bond.GetEndAtomIdx() |
|
G.add_edge(start, end) |
|
for e in G.edges(): |
|
G2 = copy.deepcopy(G) |
|
G2.remove_edge(*e) |
|
if nx.is_connected(G2): continue |
|
l = list(sorted(nx.connected_components(G2), key=len)[0]) |
|
if len(l) < 2: continue |
|
n0 = list(G2.neighbors(e[0])) |
|
n1 = list(G2.neighbors(e[1])) |
|
torsions_list.append( |
|
(n0[0], e[0], e[1], n1[0]) |
|
) |
|
return torsions_list |
|
|
|
|
|
|
|
def get_torsions(mol_list): |
|
print('USING GEOMOL GET TORSIONS FUNCTION') |
|
atom_counter = 0 |
|
torsionList = [] |
|
for m in mol_list: |
|
torsionSmarts = '[!$(*#*)&!D1]-&!@[!$(*#*)&!D1]' |
|
torsionQuery = Chem.MolFromSmarts(torsionSmarts) |
|
matches = m.GetSubstructMatches(torsionQuery) |
|
for match in matches: |
|
idx2 = match[0] |
|
idx3 = match[1] |
|
bond = m.GetBondBetweenAtoms(idx2, idx3) |
|
jAtom = m.GetAtomWithIdx(idx2) |
|
kAtom = m.GetAtomWithIdx(idx3) |
|
for b1 in jAtom.GetBonds(): |
|
if (b1.GetIdx() == bond.GetIdx()): |
|
continue |
|
idx1 = b1.GetOtherAtomIdx(idx2) |
|
for b2 in kAtom.GetBonds(): |
|
if ((b2.GetIdx() == bond.GetIdx()) |
|
or (b2.GetIdx() == b1.GetIdx())): |
|
continue |
|
idx4 = b2.GetOtherAtomIdx(idx3) |
|
|
|
if (idx4 == idx1): |
|
continue |
|
if m.GetAtomWithIdx(idx4).IsInRing(): |
|
torsionList.append( |
|
(idx4 + atom_counter, idx3 + atom_counter, idx2 + atom_counter, idx1 + atom_counter)) |
|
break |
|
else: |
|
torsionList.append( |
|
(idx1 + atom_counter, idx2 + atom_counter, idx3 + atom_counter, idx4 + atom_counter)) |
|
break |
|
break |
|
|
|
atom_counter += m.GetNumAtoms() |
|
return torsionList |
|
|
|
|
|
def A_transpose_matrix(alpha): |
|
return np.array([[np.cos(alpha), np.sin(alpha)], [-np.sin(alpha), np.cos(alpha)]], dtype=np.double) |
|
|
|
|
|
def S_vec(alpha): |
|
return np.array([[np.cos(alpha)], [np.sin(alpha)]], dtype=np.double) |
|
|
|
|
|
def GetDihedralFromPointCloud(Z, atom_idx): |
|
p = Z[list(atom_idx)] |
|
b = p[:-1] - p[1:] |
|
b[0] *= -1 |
|
v = np.array([v - (v.dot(b[1]) / b[1].dot(b[1])) * b[1] for v in [b[0], b[2]]]) |
|
|
|
v /= np.sqrt(np.einsum('...i,...i', v, v)).reshape(-1, 1) |
|
b1 = b[1] / np.linalg.norm(b[1]) |
|
x = np.dot(v[0], v[1]) |
|
m = np.cross(v[0], b1) |
|
y = np.dot(m, v[1]) |
|
return np.arctan2(y, x) |
|
|
|
|
|
def get_dihedral_vonMises(mol, conf, atom_idx, Z): |
|
Z = np.array(Z) |
|
v = np.zeros((2, 1)) |
|
iAtom = mol.GetAtomWithIdx(atom_idx[1]) |
|
jAtom = mol.GetAtomWithIdx(atom_idx[2]) |
|
k_0 = atom_idx[0] |
|
i = atom_idx[1] |
|
j = atom_idx[2] |
|
l_0 = atom_idx[3] |
|
for b1 in iAtom.GetBonds(): |
|
k = b1.GetOtherAtomIdx(i) |
|
if k == j: |
|
continue |
|
for b2 in jAtom.GetBonds(): |
|
l = b2.GetOtherAtomIdx(j) |
|
if l == i: |
|
continue |
|
assert k != l |
|
s_star = S_vec(GetDihedralFromPointCloud(Z, (k, i, j, l))) |
|
a_mat = A_transpose_matrix(GetDihedral(conf, (k, i, j, k_0)) + GetDihedral(conf, (l_0, i, j, l))) |
|
v = v + np.matmul(a_mat, s_star) |
|
v = v / np.linalg.norm(v) |
|
v = v.reshape(-1) |
|
return np.arctan2(v[1], v[0]) |
|
|
|
|
|
def get_von_mises_rms(mol, mol_rdkit, rotable_bonds, conf_id): |
|
new_dihedrals = np.zeros(len(rotable_bonds)) |
|
for idx, r in enumerate(rotable_bonds): |
|
new_dihedrals[idx] = get_dihedral_vonMises(mol_rdkit, |
|
mol_rdkit.GetConformer(conf_id), r, |
|
mol.GetConformer().GetPositions()) |
|
mol_rdkit = apply_changes(mol_rdkit, new_dihedrals, rotable_bonds, conf_id) |
|
return RMSD(mol_rdkit, mol, conf_id) |
|
|
|
|
|
def mmff_func(mol): |
|
mol_mmff = copy.deepcopy(mol) |
|
AllChem.MMFFOptimizeMoleculeConfs(mol_mmff, mmffVariant='MMFF94s') |
|
for i in range(mol.GetNumConformers()): |
|
coords = mol_mmff.GetConformers()[i].GetPositions() |
|
for j in range(coords.shape[0]): |
|
mol.GetConformer(i).SetAtomPosition(j, |
|
Geometry.Point3D(*coords[j])) |
|
|
|
|
|
RMSD = AllChem.AlignMol |
|
|