Skip to content

Instantly share code, notes, and snippets.

@ptosco
Created August 14, 2020 20:31
Show Gist options
  • Save ptosco/36574d7f025a932bc1b8db221903a8d2 to your computer and use it in GitHub Desktop.
Save ptosco/36574d7f025a932bc1b8db221903a8d2 to your computer and use it in GitHub Desktop.
CanonicalReordering
Display the source blob
Display the rendered blob
Raw
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"metadata": {},
"outputs": [],
"source": [
"from rdkit import Chem\n",
"from rdkit.Chem.Draw import MolsToGridImage"
]
},
{
"cell_type": "code",
"execution_count": 2,
"metadata": {},
"outputs": [],
"source": [
"def addAtomIndices(mol):\n",
"    for i, a in enumerate(mol.GetAtoms()):\n",
"        a.SetAtomMapNum(i)"
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {},
"outputs": [],
"source": [
"m = Chem.MolFromSmiles(\"CC[C@H](C1=CC=CC2=C1C=CC=C2)C\")\n",
"m1 = Chem.MolFromInchi(\"InChI=1S/C14H16/c1-3-11(2)13-10-6-8-12-7-4-5-9-14(12)13/h4-11H,3H2,1-2H3/t11-/m1/s1\")"
]
},
{
"cell_type": "code",
"execution_count": 4,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"True"
]
},
"execution_count": 4,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Chem.MolToSmiles(m) == Chem.MolToSmiles(m1)"
]
},
{
"cell_type": "code",
"execution_count": 5,
"metadata": {},
"outputs": [],
"source": [
"m_neworder = tuple(zip(*sorted([(j, i) for i, j in enumerate(Chem.CanonicalRankAtoms(m))])))[1]"
]
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {},
"outputs": [],
"source": [
"m1_neworder = tuple(zip(*sorted([(j, i) for i, j in enumerate(Chem.CanonicalRankAtoms(m1))])))[1]"
]
},
{
"cell_type": "code",
"execution_count": 7,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"False"
]
},
"execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"m_neworder == m1_neworder"
]
},
{
"cell_type": "code",
"execution_count": 8,
"metadata": {},
"outputs": [],
"source": [
"addAtomIndices(m)"
]
},
{
"cell_type": "code",
"execution_count": 9,
"metadata": {},
"outputs": [],
"source": [
"addAtomIndices(m1)"
]
},
{
"cell_type": "code",
"execution_count": 10,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
"<PIL.PngImagePlugin.PngImageFile image mode=RGB size=600x200 at 0x7FAE4C1997B8>"
]
},
"execution_count": 10,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"MolsToGridImage((m, m1))"
]
},
{
"cell_type": "code",
"execution_count": 11,
"metadata": {},
"outputs": [],
"source": [
"m_renum = Chem.RenumberAtoms(m, m_neworder)"
]
},
{
"cell_type": "code",
"execution_count": 12,
"metadata": {},
"outputs": [],
"source": [
"m1_renum = Chem.RenumberAtoms(m1, m1_neworder)"
]
},
{
"cell_type": "code",
"execution_count": 13,
"metadata": {},
"outputs": [],
"source": [
"addAtomIndices(m_renum)"
]
},
{
"cell_type": "code",
"execution_count": 14,
"metadata": {},
"outputs": [],
"source": [
"addAtomIndices(m1_renum)"
]
},
{
"cell_type": "code",
"execution_count": 15,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
"<PIL.PngImagePlugin.PngImageFile image mode=RGB size=600x200 at 0x7FAE4C127390>"
]
},
"execution_count": 15,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"MolsToGridImage((m_renum, m1_renum))"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.6.10"
}
},
"nbformat": 4,
"nbformat_minor": 4
}
@JanCBrammer
Copy link

Thanks @ptosco, the gist saves the day!

For those who, like me, find it taxing to parse the expression in cells 5 and 6, here's the expression somewhat unpacked:

# Step-by-step version of the one-liner in notebook cells 5 and 6.
# `Chem` is `rdkit.Chem` (imported in cell 1) and `m` is the molecule from cell 3.
#
# 1. Pair every atom's canonical rank with its current (old) index, rank first,
#    so that sorting the pairs orders them by canonical rank.
canon_idx_old_idx = [(j, i) for i, j in enumerate(Chem.CanonicalRankAtoms(m))]  # e.g. [(0, 0), (2, 1), (1, 2)]
# 2. Sort by rank, then transpose into (sorted ranks, old indices in rank order).
old_idcs_sorted_by_canon_idcs = tuple(zip(*sorted(canon_idx_old_idx)))  # e.g. ((0, 1, 2), (0, 2, 1))
# 3. Keep only the old indices: this is the new atom order that cells 11 and 12
#    hand to Chem.RenumberAtoms.
canonical_order = old_idcs_sorted_by_canon_idcs[1]  # e.g. (0, 2, 1)

Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment