Skip to content

Instantly share code, notes, and snippets.

@jp-um
Created June 16, 2017 10:53
Show Gist options
  • Save jp-um/4e9c1fad979a747833bd3d386a54699f to your computer and use it in GitHub Desktop.
Save jp-um/4e9c1fad979a747833bd3d386a54699f to your computer and use it in GitHub Desktop.
cheminformatics primer
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"/usr/local/lib/python2.7/dist-packages/IPython/html.py:14: ShimWarning: The `IPython.html` package has been deprecated since IPython 4.0. You should import from `notebook` instead. `IPython.html.widgets` has moved to `ipywidgets`.\n",
" \"`IPython.html.widgets` has moved to `ipywidgets`.\", ShimWarning)\n"
]
}
],
"source": [
"import rdkit\n",
"from rdkit import Chem\n",
"from rdkit import DataStructs\n",
"from rdkit.Chem import AllChem\n",
"\n",
"from rdkit.Chem.Draw import IPythonConsole #Needed to show molecules\n",
"from rdkit.Chem import Draw"
]
},
{
"cell_type": "code",
"execution_count": 2,
"metadata": {},
"outputs": [],
"source": [
"# John wants some alkenes (or alkanes?) ... let us show him some\n",
"\n",
"# alkene\n",
"ethene = Chem.MolFromSmiles(\"C=C\")\n",
"propene = Chem.MolFromSmiles(\"CC=C\")\n",
"\n",
"# alkane\n",
"methane = Chem.MolFromSmiles(\"C\")\n",
"ethane = Chem.MolFromSmiles(\"CC\")\n",
"\n",
"# note in cheminformatics we typically ignore Hs, as these are everywhere and double the size of the graph"
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAcIAAACWCAYAAABNcIgQAAAKAklEQVR4nO3dYUjUhx/H8c+VlXYZ\nldGWOGqonUqxllFZXXk9ajAHsVEQZHsQBHuwq8EY1RiyqIiodj3Yo6CwZ/YsYYbRflpZc80sFK1x\nZxZJVyS1ynk6r9//wSBw/2quTn/m9/16dlp3H39P3v5+v1N9ruu6AgDAqHFeDwAAwEuEEABgGiEE\nAJhGCAEAphFCAIBphBAAYBohBACYRggBAKYRQgCAaYQQAGAaIQQAmEYIAQCmEUIAgGmEEABgGiEE\nAJhGCAEAphFCAIBphBAAYBohBACYRggBAKYRQgCAaYQQAGAaIQQAmEYIAQCmEUIAgGmEEABgGiEE\nAJhGCAEAphFCAIBphBAAYBohBACYRghhyvHjx9Xe3j7oY9evX9exY8c8WuQdjgXwN0IIADCNEAIA\nTCOEAADT0rweAIy0M2fOyHGc54+TyaSmTJni4SLvcCwAQgiDgsGg8vLynj+OxWJqbm72cJF3OBYA\nIYRB6enpyszMHPTYKo4FwD1C4IWePn3q9YSUG4tfE5AKhBD4h7t37+ro0aM6d+6c+vv7vZ7zxvr7\n+3Xu3DkdPXpU8Xjc6znAqONzXdf1egQw2ty+fVt1dXV68uSJSkpKtHDhQo0b93Z935hMJtXU1KTL\nly8rMzNToVBI7733ntezgFGHEAIv4bqu2tvbVV9fr/T0dJWWlur999/3etaQ3Lx5U3V1dUokElq9\nerUKCwvl8/m8ngWMSoQQ+BeJREKXL19WU1OTcnJyFAqFlJWV5fWsF+ru7pbjOLpz546Ki4u1ZMkS\nTZo0yetZwKhGCIEhevjwoerq6tTZ2amFCxdq+fLloyYyfX19unjxoq5evaq5c+eqtLRU06dP93oW\n8FYghMB/dOvWLTmOoz///FPLli3Thx9+6NllR9d11dzcrF9++UV+v1+lpaWaM2eOJ1uAtxUhBF7D\ns2fP1NraqgsXLjx/I0pOTs6Ibujs7JTjOOrt7dXKlSs1f/78t+4NPcBoQAiBN9DT06Pz58+rra1N\n+fn5Ki4uVnZ29rC+ZldXl5qamhSNRlVUVKRgMCi/3z+srwmMZXz7CLwBv9+vtWvXauPGjTp9+rQC\ngYD27dunRCKR8tdKJBLau3evAoGAamtrtXHjRq1du5YIAm+IM0Ighaqrq7V9+3b19vZq37592rRp\n0xvfP3RdVydOnNCOHTuUkZGhw4cPq6ysLEWLARBCIMX++usv/fjjj/ruu+8UCAR05MgRLVu27LWe\n69KlSwqHw7px44a+//57ffHFF5owYUKKFwO2cWkUSLEJEyYoHA4rFouppKREwWBQ5eXlunfv3pCf\nIx6Pq7y8XKtWrVJJSYlisZjC4TARBIYBIQSGycyZMxWJRNTY2KjOzk7l5uaqoqJCfX19L/0/fX19\nqqioUF5enm7duqXGxkZFIhHNnDlzBJcDtnBpFBgh1dXVCofDSktL08GDB//vPt/Jkye1a9cuDQwM\nKBKJcB8QGCGEEBhBvb29OnLkiPbs2aOlS5fqhx9+kCRt27ZNjY2N2rVrl7788ktlZGR4OxQwhBAC\nHujo6NDXX3+tn376Sa7r6uOPP9aBAwfeml/qDYwlhBDw0Pr16yVJVVVVHi8B7ErzegBg2bRp07ye\nAJjHu0YBAKYRQmAY9fX1qbq6+pU/MgHAW4QQGEbd3d365JNP1N3d7fUUAC9BCAEAphFCAIBphBAA\nYBohBACYRggBAKYRQgCAaYQQAGAaIQQAmEYIAQCmEUIAgGmEEABgGiEEAJhGCAEAphFCAIBphBAA\nYBohBACYRggBAKYRQgCAaYQQAGAaIQQAmEYIAQCmEUIAgGmEEABgGiEEAJhGCAEAphFCAIBphBAA\nYBohBACYRggBAKYRQmAYZWVl6dSpU8rKyvJ6CoCXSPN6ADCWTZo0SWVlZV7PAPAKnBECAEzjjBDw\n0KNHj7yeAJjHGSHggY6ODn366aeqrq7WqVOn9Nlnn+nmzZtezwJMIoTACHrw4IG2bt2qgoIC+f1+\nxWIxdXR0aPLkyQoEAtq6dasePHjg9UzAFEIIjICBgQFFIhEFAgG1tLSooaFBlZWVys7OVnZ2tior\nK9XQ0KCWlhYFAgFFIhENDAx4PRswwee6ruv1CGAsq6mp0VdffaVHjx5p//792rRpk3w+3wv/reu6\nOnHihL755htNmzZNhw4d0kcffTTCiwFbOCMEhkksFlNZWZnWrVunDRs2KBqNqry8/KURlCSfz6fy\n8nJFo1Ft2LBB69atU1lZmWKx2AguB2whhECK/fHHHwqHwyosLFRGRoZaW1tVUVEhv98/5Ofw+/2q\nqKhQS0uLMjIyVFhYqHA4rMePHw/jcsAmQgikSDKZVCQSUW5urn7++WfV1NSoqqpKeXl5r/2c+fn5\nqqqqUk1Njc6ePavc3FxFIhElk8kULgds4x4hkALxeFy7d+9WZWWldu7cqe3btys9PT2lr5FIJHTo\n0CHt3btXn3/+ub799lu9++67KX0NwCJCCLyBnp4enT9/Xm1tbcrPz1dxcbGys7OH9TW7urrU1NSk\naDSqoqIiBYPB/3TZFcBghBB4Df39/WpsbNSVK1eUk5OjUCikGTNmjOiG+/fvy3EcxeNxLVq0SEuX\nLtXEiRNHdAMwFhBC4D9wXVctLS26dOmSxo8fr1AopNzcXE83xWIxOY6jZDKpkpISLViw4JXvTAUw\nGCEEhqirq0uO4+jhw4dasWKFPvjgA40fP97rWZL+fqPOtWvX1NDQoOnTp2vNmjXDfokWGCsIIfAv\nHj9+rPr6ekWjUc2fP1/Lly8ftffkenp6dPHiRbW2tiovL0+rV6/W1KlTvZ4FjGqEEHiJgYEB/frr\nr/rtt980a9YshUIhvfPOO17PGpJ79+7JcRzdv39fixcv1pIlS5SWxh+bAV6EEAIv0NbWpgsXLsjn\n82nNmjWe3wd8Xb///rvq6+vluq5WrlypoqIirycBow4/UA9Tjh8/rvb29kEfu379uo4dO/b88d27\nd1VbW6uCggJt3rz5rY2gJM2bN0+bN29WQUGBamtrFY/Hn39uKMcCsIBrJcA/zJ49W1u2bNGUKVO8\nnpISEydO1KpVq7Ro0aIx8zUBqcQZIfACYzEYY/FrAlKBEAIATOPSKMw5c+aMHMd5/jiZTJo9W+JY\nAIQQBgWDwUF/ESIWi6m5udnDRd7hWACEEAalp6crMzNz0GOrOBYA9wgBAMYRQgCAafxmGQCAaZwR\nAgBMI4QAANMIIQDANEIIADCNEAIATCOEAADTCCEAwDRCCAAwjRACAEwjhAAA0wghAMA0QggAMI0Q\nAgBMI4QAANMIIQDANEIIADCNEAIATCOEAADTCCEAwDRCCAAwjRACAEwjhAAA0wghAMA0QggAMI0Q\nAgBMI4QAANMIIQDANEIIADCNEAIATCOEAADTCCEAwLT/AU5BEzJkg2xCAAAAAElFTkSuQmCC\n",
"text/plain": [
"<rdkit.Chem.rdchem.Mol at 0x7f6a180b16e0>"
]
},
"execution_count": 3,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Chem.AddHs(ethene) "
]
},
{
"cell_type": "code",
"execution_count": 4,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAcIAAACWCAYAAABNcIgQAAAQo0lEQVR4nO3dfUyV5ePH8Q8HETE0\nTU2zNBJUsLTEfMqwJ81y6lrNiqVUulELp83Htpq4LIeJK6tRtsqHNUuorSxsBUsTdRYUIk4gxSRL\nw4o0FBE55/r+8R3u6+/XwzHPOdeB6/3a/OM+nOu+P2y6j9f9dEUYY4wAAHCUx3YAAABsoggBAE6j\nCAEATqMIAQBOowgBAE6jCAEATqMIAQBOowgBAE6jCAEATqMIAQBOowgBAE6jCAEATqMIAQBOowgB\nAE6jCAEATqMIAQBOowgBAE6jCAEATqMIAQBOowgBAE6jCAEATqMIgRBau3atKioqzvussrJSa9as\nsZQIAEUIAHAaRQgAcBpFCABwWjvbAQDXFBQUaMuWLee2vV6vYmNjLSYC3EYRAiGWkpKihISEc9vV\n1dUqLS21mAhwG0UIhFiHDh3UqVOn87YB2MM1QgCA0yhCAIDTIowxxnYIAABsYUYIAHAaRQgAcBpF\nCABwGkUIAHAaRQhYcuTIEf3www+2YwDO44F6wJIDBw7ojz/+UN++fW1HAZzGjBCwxOPxyOfz2Y4B\nOI8iBCzxeDzyer22YwDOowgBSyIjI5kRAmGAIgQs4dQoEB4oQsASihAIDxQhYAnXCIHwQBEClnCN\nEAgPFCFgCTNCIDxQhIAlbWVGuHbtWlVUVJz3WWVlpdasWWMpEXBhKELAEm6WAcIDRQhYQhEC4YEi\nBCzhGiEQHnjpNmBRVFSU7QgBUVBQoC1btpzb9nq9io2NtZgI8B9FCFhy6NAhzZ07VzNnzrQd5aKl\npKQoISHh3HZ1dbVKS0stJgL8RxEClkRFRens2bO2YwREhw4d1KlTp/O2gdaCa4SAJW2pCIHWjCIE\nLGnfvr2am5tljLEdBXBahOFfIWDFnj17dP3116upqanN3DQDtEbMCAFLWsqP06OAXRQhYAlFCIQH\nihCwhCIEwgNFCFjSUoRNTU2Wk1y42tpaNTQ02I4BBARFCARJc3OzXnrpJeXl5f3pz1vrjNDn8yk/\nP19lZWW2owABQRECQVBUVKTk5GStXLlSMTExf/qd9u3bS2p9RVhaWqrm5mYNHz7cdhQgIChChIwL\n69bV1NRo8uTJuvPOO3Xvvffqu+++06RJk/70u61xRnj69Gnt2rVLo0ePVrt2vJgKbQNFCATAmTNn\ntGTJEg0aNEg+n0979+7VkiVL/nI2KLXOIvz666/VuXNnXXfddbajAAFDEQIX6fPPP9eQIUO0du1a\nvffee8rPz1d8fPw/jjt9+rSk/84iW4Pjx4+rtLRUKSkpioiIsB0HCBiKEPiXDh8+rMmTJ2vKlClK\nTU3Vvn37NHnyZL/Gbty4UUlJSUpMTNTUqVM1b9481dXVBTnxxdmxY4euuuoqxcXF2Y4CBBQn+RFS\nbWHduqamJi1btkzZ2dkaM2aMysvL1b9/f7/GFhcX64knnlBVVZWWLl2qjIwMFRcXa8GCBerbt69m\nzZqlp59++ryVHMLBkSNHVFVVpenTp9uOAgQcRYiQau3r1hUWFmrWrFlqaGjQu+++6/cM8MSJE1q8\neLFycnKUmpqqjz76SL1795YkjR49WkVFRXr//ff11FNP6Z133tHixYs1c+ZMRUZGBvPX8VtRUZGS\nkpLUo0cP21GAgOPUKEKqZd26lj+tZd262tpapaWlaeLEibrnnntUUVHhVwkaY7R+/XolJiaqsLBQ\nn3/+udavX3+uBFtERERo6tSpqqio0OLFi/XMM89o8ODBf/kMYihVV1ertrZWKSkptqMAQUERIqzs\n3btXBw4csB3jHK/Xq1WrVmngwIE6ePCgiouLlZWVpUsuueQfx+7du1e33nqrMjIy9NRTT2n37t26\n7bbb/nZM+/btlZ6erqqqKk2ZMkVpaWkaP368tVmzz+fTtm3blJyc3OpOYQP+oggRVk6dOqX8/Hxt\n3LhRR48etZpl586dGjZsmJYtW6aXX35ZRUVFuv766/9xXH19vebMmaPk5GRdffXVqqio0Jw5cy5o\nqaWuXbsqKytLVVVVuuKKKzR8+HDdf//9OnTo0EX8RheuvLxcjY2NGjFiREiPC4SUAcJMQ0OD2bZt\nm3nxxRdNXl6eOXbsWEiPX1tba6ZPn27atWtnZs+ebX7//Xe/x65bt8707t3b9OvXz3z88ccBy1Rc\nXGxuueUWExMTYxYtWmSOHz8esH3/lZMnT5qXX37ZlJSUBP1YgE0UIcJWXV2d2bRpk1m5cqXZvHmz\nqa+vD+rxmpubzUsvvWS6dOliRo0aZb755hu/x+7bt8/cdtttpkOHDiYzM9M0NDQEJWNBQYG57rrr\nTLdu3UxWVpZpbGwMynGMMWbx4sVmwIABpqmpKWjHAMIBRYiwd+TIEfPee++ZVatWmW3btpkzZ84E\n/Bg7d+40Q4cONd27dzfr1q0zXq/Xr3H19fVm9uzZJioqykycONEcOHAg4Nn+r7Nnz5rVq1ebXr16\nmQEDBpjc3Fzj8/kCeozDhw+bmJgY88EHHwR0v0A4ijDGGNunZwF/VFdX68svv1RjY6NuvPFGDRs2\n7KIfL/jll180b948bdiwQRkZGcrMzNRll13m19i8vDzNnTtXkZGReuWVV/x+lCJQTp06pVdffVXP\nP/+8Bg0apBUrVgTszs709HRVVFSoqKgoIPsDwprtJgYuhNfrNWVlZSYnJ8e89dZbpqqq6l/tx+fz\nmXfeecdcccUVZuDAgaawsNDvsQcPHjSTJk0y0dHRJjMz05w6depfZQiUH3/80aSnp5vIyEgzadIk\ns3///ovaX3l5uWnXrp3ZtWtXgBIC4Y0ZIVqlxsZG7dq1S7t379ZVV12lkSNHqk+fPhe0j9TUVI0a\nNUoZGRl+raTQ2NiorKwsvfDCCxo7dqxeeeUVv98oEwoVFRXKzMzUhx9+qEcffVRLly7V5ZdffsH7\nmTx5smJiYpSbmxuElEAYst3EwMU4ceKEyc/PN3FxcWb69Onmhx9+CMpxNm/ebOLj402fPn3Mpk2b\ngnKMQCkoKDBDhw41sbGxJjMz05w+fdrvsYWFhSY6OtocPHgwiAmB8MJzhGjVOnfurIkTJ2rz5s1q\nbGxUfHy8HnvsMR07diwg+29ZX/Cee+7RtGnT/H6jjE3jxo1TSUmJ3n77ba1bt079+/fXG2+8Ia/X\n+7fjfD6fFixYoMcff1zXXHNNiNICYcB2EwOBVFhY+K9nQ/+rsbHRZGZmmo4dO5px48aZysrKACcN\njYaGBpOVlWUuvfRSM2zYMPPFF1/85Xc3bNhgLrvsMlNXVxfChIB9FCHaHK/Xa3Jzc01cXJzp06eP\nWb16td+PQxhjzGeffWb69+9vevbsadatWxfwRxNs+PXXX82iRYtMdHS0GTdunCkrKzvv542NjSYu\nLs4sX77cUkLAHk6Nos3xeDyaOnWq9u3bp4yMDC1cuFAjRozQ1q1b/3Zcy/qCEydO1N13363Kykql\npaW1iUVou3XrpqysLO3Zs0ddu3ZVcnKy0tLSzr3GLicnR8YYzZ4923JSIPQoQrRZMTExWrRokaqr\nqzVu3DhNmDBB48ePV3l5+Xnfa2pq0pIlS5SUlKTffvtNJSUlWrVqlbp06WIneBANGDBAubm52rFj\nhw4dOqSEhAQ9+eSTevbZZ/Xcc8+1mtVAgECiCNHmtcyGysvL1bVrVw0bNkyPPfaYfv75Z23fvl3D\nhw9XTk6OcnJytGPHDt1www22IwfdyJEjtXXrVr322mtav369IiMjZYyRz+ezHQ0IOZ4jhHM+++wz\nLVy4UIcPH9Yff/yh1NRUrVixQr169bIdLeRqamqUmJiotLQ0bdy4UfHx8crOzv7H5aKAtoQihJN8\nPp9SUlI0ePBgvf7667bjWDNt2jQdP35cn3zyiU6ePKns7Gy98MILGj16tFasWKHk5GTbEYGg49Qo\nnOTxeNSjRw/16NHDdhRrSkpKlJeXp+zsbElSbGyslixZov379yshIUGjRo3S/fffr++//95yUiC4\nKEI4q3379jp79qztGNbMnz9fDz/8sBITE8/7/Morr9Tq1au1e/duSVJiYqLmzJmjEydOWEgJBB9F\nCGdFRUWpqanJdgwr8vPz9e233+q55577y+8MGjRIubm52rx5s7Zv3674+HgtX75cZ86cCWFSIPgo\nQjgrKirKyRlhc3Oz5s+fr7lz5/r1Uu477rhDJSUleu211/TGG29oyJAhysvLE7cXoK2gCOEsV4tw\nzZo1OnHihObPn+/3mIiICE2dOlV79uzRQw89pBkzZuiuu+4690A+0Jpx1yic9cQTT+jMmTN66623\nbEcJmfr6eiUkJGjp0qVKT0//1/upra3VRx99pIaGBg0cOFBjxoxR586dA5gUCB1mhHCWizPClStX\nqkePHpo5c+ZF7adnz55KT0/XjBkzJElvv/22CgoK1NDQEIiYQEhRhHCWa0V49OhRZWdnKysrS5GR\nkQHZZ+fOnXX33XfrwQcfVF1dnd58803t3LlTzc3NAdk/EAr/vCw30Ea59vhEZmamRo0apUmTJgV8\n37169dIDDzygmpoabdmyReXl5Ro9erQGDx7cJl5ajraNIoSzXHp8oq6uTkOGDLmo64L+uPrqq5WW\nlqa9e/dqx44d+uabbzRmzBgNGDAgqMcFLgZFCGe5dGr0yy+/VL9+/XTjjTcG/Vgej0dDhgxRUlKS\niouL9emnn6qsrExjx45Vz549g3584EJxjRDOcqUIa2pqVFNTo5tvvjmkx42KitJNN92kGTNmqEuX\nLtqwYYM+/vhj3lCDsEMRwlkuFKExRtu2bdPQoUOtPd7QqVMnjR8/Xg888IBOnjypLVu2nPvZ2rVr\nVVFRcd73KysrtWbNmlDHhMM4NQpnxcfH6/bbb7cdI6gqKytVX1+vkSNH2o6i3r17KzU1lVe0IexQ\nhHBWXFyc6uvrbccImrNnz6qoqEgjRowIq5Xno6OjbUcAzsOpUTjL4/G06RXZd+/eLY/Ho6FDh9qO\nAoQ1ZoRwVmRkZJstwtOnT+urr77SHXfcEbCH54OloKDgvOuGXq9XsbGxFhPBNRQhnOXxeOT1em3H\nCIpdu3apS5cuSkpKsh3lH6WkpCghIeHcdnV1tUpLSy0mgmsoQjirrc4If//9d5WVlem+++6zHcUv\nHTp0UKdOnc7bBkKJa4RwVlu9Rrh9+3b17dtXffr0sR0FaBUoQjirLZ4a/emnn7R//36NHTvWdhSg\n1eDUKJzVFmeEXbt21YQJE9S9e3fbUfzyyCOP/L/PEhMTlZiYGPowcBYzQjirLV4j7Nixo6699lrb\nMYBWhSKEs9rijBDAhaMI4azIyMg2d40QwIWjCOEsj+e/f/2ZFQJuowjhLIoQgEQRwmGtsQhZtggI\nPIoQzurYsaNSUlLOFSIAN/EcIZwVHR2tESNG2I4BwDL+KwwAcBozQqCVYdkiILAoQqCVYdkiILA4\nNQrntPY7L1uWLWr5w7JFwMWhCAEATqMIAQBO4xoh0IqwbBEQeBQhnMSdlwBaUIRwEndeAmhBEcJJ\nLXde/u82ADdxswwAwGkUIQDAaRHGGGM7BAAAtjAjBAA4jSIEADiNIgQAOI0iBAA4jSIEADiNIgQA\nOI0iBAA4jSIEADiNIgQAOI0iBAA4jSIEADiNIgQAOI0iBAA4jSIEADiNIgQAOI0iBAA4jSIEADiN\nIgQAOI0iBAA4jSIEADiNIgQAOO0/CLSx3rjDrOMAAAAASUVORK5CYII=\n",
"text/plain": [
"<rdkit.Chem.rdchem.Mol at 0x7f6a1800f130>"
]
},
"execution_count": 4,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Chem.AddHs(propene)"
]
},
{
"cell_type": "code",
"execution_count": 5,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAcIAAACWCAYAAABNcIgQAAAD7klEQVR4nO3dIW4qaxjH4bc3FYhB\nYCuqWEKTKmRFF9AtdFE14Cu6AASitglyMMMWuoGSOeqQYM5Nys35evk/j/smmeHNmF9mBoarcRzH\nAoBQ/7QeAABaEkIAogkhANGEEIBoQghANCEEIJoQAhBNCAGIJoQARBNCAKIJIQDRhBCAaEIIQDQh\nBCCaEAIQTQgBiCaEAEQTQgCiCSEA0YQQgGhCCEA0IQQgmhACEE0IAYgmhABEE0IAogkhANGEEIBo\nQghANCEEIJoQAhBNCKGB1WpVfd+fbNvtdrVcLhtNBLmEEIBoQghANCEEINp16wEg1Xq9rs1mc1wf\nDofquq7hRJBJCKGRxWJR8/n8uB6GobbbbcOJIJMQQiOTyaSm0+nJGvj7PCMEIJoQAhDtahzHsfUQ\nANCKK0IAogkhANGEEIBoQghANCGEhoZhqGEYWo8B0YQQGtrv97Xf71uPAdGEEIBoQghANCEEIJoQ\nAhBNCAGIJoQARBNCAKIJIQDRhBCAaEIIQDQhBCCaEAIQ7br1AJDs6+ur9QgQTwihobe3t6qqenx8\nbDwJ5HJrFIBoQghANCEEIJoQAhBNCAGIJoQARBNCAKIJIQDRhBCAaELIxVqtVtX3/cm23W5Xy+Wy\n0UQ/n3NGIiEEIJoQAhDNS7eJ9vn5WR8fH2cd4/X19dv7vr+/V1XV8/Pzt4/x9PT07X2rqu7u7mo2\nm511DPg/E0Iu2nq9rs1mc1wfDofquq7hRD+fc0YaIeSiLRaLms/nx/UwDLXdbo/r2WxWDw8PZ33G\nOfv/vhJ8eXk5a4b/0r+dM7g0QshFm0wmNZ1OT9b8mXNGGl+WASCaEAIQ7Wocx7H1EJDqJz4jhDSu\nCAGIJoQARBNCAKIJIQDRhBCAaEIIQDQhBCCaEAIQzbtGoaHb29vWI0A8IYSG7u/vW48A8dwaBSCa\nEAIQTQgBiCaEAEQTQgCiCSEA0YQQgGhCCEA0IQQgmhACEE0IAYgmhABEE0IAovn3CWjo5uam9QgQ\n72ocx7H1EADQilujAEQTQgCiCSEA0YQQGlitVtX3/cm23W5Xy+Wy0USQSwgBiCaEAEQTQgCi+UE9\nNLJer2uz2RzXh8Ohuq5rOBFkEkJoZLFY1Hw+P66HYajtdttwIsgkhNDIZDKp6XR6sgb+Ps8IAYgm\nhABE89JtAKK5IgQgmhACEE0IAYgmhABEE0IAogkhANGEEIBoQghANCEEIJoQAhBNCAGIJoQARBNC\nAKIJIQDRhBCAaEIIQDQhBCCaEAIQTQgBiCaEAEQTQgCiCSEA0YQQgGhCCEA0IQQgmhACEE0IAYgm\nhABEE0IAogkhANGEEIBovwBiLZZNp3I9KgAAAABJRU5ErkJggg==\n",
"text/plain": [
"<rdkit.Chem.rdchem.Mol at 0x7f6a05e1a670>"
]
},
"execution_count": 5,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Chem.AddHs(methane) "
]
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAcIAAACWCAYAAABNcIgQAAAEnklEQVR4nO3dMWpbWQCF4ZuJCxUS\nhEBcGAIpVAhClqDgKuAyO0iVRWQBWYQbaQdZgAoFb0BpIimFwIVtSJc+EZpOxqgYSZ6Z+x7n+7or\neObAA/8825KfbDabTQGAUH/VHgAANQkhANGEEIBoQghANCEEIJoQAhBNCAGIJoQARBNCAKIJIQDR\nhBCAaEIIQDQhBCCaEAIQTQgBiCaEAEQTQgCiCSEA0YQQgGhCCEA0IQQgmhACEE0IAYgmhABEE0IA\nogkhANGEEIBoQghANCEEIJoQAhBNCAGIJoSwh/F4XBaLxYPXlstlGY1GlRbda/I2aAMhBCCaEAIQ\nTQgBiHZSewC0xWQyKdPpdHter9el2+1WXHSvydug6YQQ9jQcDku/39+eV6tVmc1mFRfda/I2aDoh\nhD11Op3S6/UenJuiydug6fyOEIBoQghAtCebzWZTewQA1OKJEIBoQghANCEEIJoQAhBNCOFA8/m8\n3Nzc1J6x4+bmpszn89ozoHWEEA40n8/L7e1t7Rk7bm9vhRCOIIQARBNCAKIJIQDRhBCAaEIIQDQh\nBCCaEAIQTQgBiCaEAEQTQgCiCSEA0YQQgGhCCEf4/ft37Qk7mrgJ2kAI4UCXl5fl6uqq9owdV1dX\n5fLysvYMaB0hBCCaEAIQTQgBiCaEAEQTQgCiCSEA0YQQgGhCCEA0IQQgmhDSKOPxuCwWiwevLZfL\nMhqNKi3iWO4lbSGEAEQTQgCindQeAIe6u7sr379/P/r6P3/+lC9fvhx9/Y8fP8qvX7/K9fX10V/j\nv/Dt27fy8+fP8vHjx6O/xvv378vJyfHfFl6/fl3Ozs6Ovh5qEEIaZzKZlOl0uj2v1+vS7XYrLuJY\n7iVtIIQ0znA4LP1+f3terVZlNpttz2dnZ49+6ri4uDj62nfv3pXz8/Py6dOnR234t33+/Ll8/fq1\nUf+K6Z/uJTSBENI4nU6n9Hq9B2fayb2kDfyxDADRhBCAaH40SqN8+PBh57XBYFAGg8H/P4ZHcS9p\nC0+EAEQTQgCiCSEA0YQQgGhCCEA0IQQgmhACEE0IAYgmhHCgwWBQTk9Pa8/YcXp66s3qcASfLAMH\nevv2bXn58mXtGTvevHlTnj17VnsGtI4nQgCiCSEA0YQQgGhCCEA0IQQgmhACEE0IAYgmhABEE0IA\nogkhANGEEIBoQghANCEEIJr/PgEHevXqVXn+/HntGTtevHhRnj59WnsGtM6TzWazqT0CAGrxo1EA\nogkhANGEEIBoQgh7GI/HZbFYPHhtuVyW0WhUadG9Jm+DNhBCAKIJIQDRhBCAaN5QD3uaTCZlOp1u\nz+v1unS73YqL7jV5GzSdEMKehsNh6ff72/NqtSqz2aziontN3gZNJ4Swp06nU3q93oNzUzR5GzSd\n3xECEE0IAYjmQ7cBiOaJEIBoQghANCEEIJoQAhBNCAGIJoQARBNCAKIJIQDRhBCAaEIIQDQhBCCa\nEAIQTQgBiCaEAEQTQgCiCSEA0YQQgGhCCEA0IQQgmhACEE0IAYgmhABEE0IAogkhANGEEIBoQghA\nNCEEIJoQAhBNCAGIJoQARBNCAKL9DVcE6YqqoaqKAAAAAElFTkSuQmCC\n",
"text/plain": [
"<rdkit.Chem.rdchem.Mol at 0x7f6a05e1a910>"
]
},
"execution_count": 6,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"Chem.AddHs(ethane)"
]
},
{
"cell_type": "code",
"execution_count": 7,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAcIAAACWCAYAAABNcIgQAAAmDklEQVR4nO3dd1iUV9oG8Js+VGlW\nxBYRFRGNJSgao5JiQuLajdnRFRWNroCIYh/U1UBMzLBqLBuTJYmuYc1+EXtQE3tBYkMMxBaliB1C\nL/N8f0wwkkFpw5yZeZ/fdXklcKbcMDr3nLec14SICIwxxphEmYoOwBhjjInERcgYY0zSuAgZY4xJ\nGhchY4wxSeMiZIwxJmlchIwxxiSNi5AxxpikcREyxhiTNC5CxhhjksZFyBhjTNK4CBljjEkaFyFj\njDFJ4yJkjDEmaVyEjDHGJI2LkDHGmKRxETLGGJM0LkLGGNOR8vJy0RFYFbgIGWNMBz788ENMnDhR\ndAxWBRMiItEhGGPM2F25cgU+Pj5ISEjAgAEDRMdhT+EiZIwxHQkNDcXhw4dx9uxZmJmZiY7Dfseb\nRhljTEcUCgUyMjLw2WefiY7CnsJFyBhjOuLk5ITly5djwYIFePDggeg47He8aZQxxnRIpVLhpZde\ngp+fH5RKpeg4DFyEjDGmc8ePH8fAgQORlJQEb29v0XEkj4uQMcYEGDt2LO7fv48DBw6IjiJ5XISM\nMSZAeno6OnbsiC1btmDo0KGi40gaFyFjjAmyaNEi/N///odL58/D1NJSdBzJ4iJkjDFB8vPzceP1\n19Fl2DBg9mzRcSSLi5AxxkT673+BwEAgNRVo0UJ0GkniImSMMdEGDgTc3YEvvxSdRJK4CBljTLTL\nl4Hu3YFDh4B+/USnkRwuQsYY0wfvvw8kJgJnzgCmvOiXLvFvmzHG9MGKFcDNm7x5VAAuQsYY0wfO\nzoBCAcybB+TkiE4jKbxplDHG9EV5uXpf4RtvAB9+KDqNZHARMsaYPjl0CBgyBLh0CejQQXQaSeAi\nZIwxfRMQADRpAnz+uegkksBFyBhj+iYrC7C1BRwcRCeRBC5CxhhjksZHjTLGGJM0LkLGGGOSxkXI\nnispKQl/+9vfEBgYiBs3boiOw3QpPx+YPh1o2RJwcwP691evesJ0i1+HBsdFyKqUnZ2NyZMno2/f\nvjAxMcHDhw/RuXNnLFiwAHl5eaLjMV2YNAn47Tfgl1+AjAxg7lzgrbfUB3Iw3eHXocFxEbJKCgsL\nERkZiXbt2iE7OxvJycn44osv8N133+Ho0aM4fPgwWrdujZiYGJSVlYmOqzV2dsBrr/3x9f37gKOj\nsDjipaYC+/cD69cD1tbq7739NjBiBPDJJ2KzSQm/DjrBRcgAAESEL7/8Eh06dMD27duxY8cO7Ny5\nEx4eHk9u07NnTxw7dgwbNmzA6tWr4e3tjT179ghMrV2pqcCRI6JT6ImLFwEvL/UnhKf5+qrHmG7w\n66ATXIQM58+fx8CBAxEcHIzw8HCcO3cO/v7+Vd7WxMQEo0aNwpUrVzBmzBiMHDkSr776Ki5fvqzj\n1Nq3ZAmweLHoFHpO0NlWx44dw4kTJ4Q8t17is960iotQwu7evYvx48ejV69e8PHxwbVr1xASEgIL\nC4tq72tjY4PIyEikpaWhefPmePHFFxESEoLHjx83fPAGMnw4kJcHfP+96CR6wNtbfY28P+8PPnVK\nPaZj+/btw4QJE1BcXKzz5xZKz14Ho0VMcoqKiigqKoocHR2pX79+lJSUVO/HPHXqFPn6+pKzszMp\nlUoqLS3VQlLdsbUlevSIaNcuot69ie7dI2rUSHQqwUaNIvrrX4kKCtRf79xJ5OJClJGh8yj5+fnU\nqlUr+uijj3T+3MLp0etgrLgIJWbXrl3UoUMHat26NcXHx9foPmfOnKEDBw5Ue7vy8nKKjY2lZs2a\nUceOHWnPnj31jaszFUVIRNSnD9HmzVyE9NtvRFOnErVoof7j50d08qSwOF999RXZ29tTVlaWsAxC\n6NnrYIy4CCUiOTmZ/P39SSaTkUKhoPz8/Brfd9OmTWRtbU1/+ctf6OrVq9XePi8vjxQKBclkMvL3\n96fLly/XJ7pWlZQQxccTyeVErq5EFy+qv/90ER44QNS6NRehvlGpVNSvXz+aMmWK6CjMyPA+QiOX\nk5ODkJAQdO/eHc2bN0daWhoiIyNhY2NT48eYMmUKrl27hiZNmsDLywtTp07FvXv3nnl7W1tbREZG\n4tKlS3ByckK3bt0QEhKCHEEXGy0vB378EQgOBtq2BUaNAh4+VF/urVUrzdsPHgy0a6fzmKwaJiYm\niImJwRdffIHExETRcZgxEd3ErGGUlZWRUqkkFxcX6tq1Kx06dEgrj5uUlET9+/cnJycnioqKouLi\n4mrvc+jQIeratSu5uLiQUqmksrIyrWR5nrw8othY9e4VR0f17E4uV88GCwsb/OlZA5o4cSL17duX\nVCqV6CjMSHARGqEjR45Q9+7dqXHjxhQbG0vl5eVaf474+Hhq06YNeXp60u7du6u9fcX+wyZNmlCn\nTp1o7969Ws+Um6suv4AAImtroiZNiIKDiRISiIqKtP50xiM+nuiHH0SnqLE7d+5Qo0aN6D//+Y/o\nKMxIcBEakRs3blBAQACZm5tTcHAwPXz4sEGfr6CggKKiosje3r7G+wIfPXpEERERZGVlRQEBATXa\n51hdhv/97380btw48vFJJicnovHjiXbs4JlfjTx+rP7EsG6d6CS1Eh0dTS1btqS8vDzRURrGo0dE\ntdiPz+qHi9AI/PbbbxQREUHW1tb0xhtv0JUrV3T6/Onp6SSXy8nS0pKCg4Pp8ePH1d4nNTWVAgIC\nyMLCosb3qZCfn0/bt2+nsWPHkp2dHbm4uNCkSZPowIGfqQZbauukvJwoO7thHluo8HCirl2JdLC5\nWpuKi4upQ4cOpFAoREdpGJMnE40cKTqFZHARGjCVSkWxsbHk5uZG7dq1q/HpEA3lzJkz1Ldv31rt\nC0xISKAuXbpUe5+7d++SUqkkf39/srKyonbt2lFERAQdPXq0QTb9/llUFJGPj5HNMlNTiSwtiQ4e\nrHp83z71JwA9tWPHDrK2tqYbN26IjqJdp08TmZsTnTsnOolkcBEaqFOnTlHv3r3J3t6elEpljQ5a\n0QWVSkVxcXHUqlUr6tSpE+3bt6/a+5SWltLGjRvJ1dWVOnfu/OQ+2dnZpFQqyc/Pj8zMzKh9+/ak\nUCgoOTm5oX8MDXl5RB07EhnVkfvvvEM0dGjVYwcOqEuynpuuG9obb7xBY8aMER1De1Qq9YmskyeL\nTiIpXIQGaM2aNWRubk7Dhg2ja9euiY5Tpfz8/CfnEgYEBNQoZ2ZmJk2cOJHMzMxo0KBBZG1tTc2b\nN6cZM2bQDz/8oJOjTZ/n4kUimYxo61ahMbRj3z4iKyuiql6XkhKiTp2I5s3Tfa5aSklJIQsLC/rx\nxx9FR9GOrVvVhzgb5XZ4/cVFaGAKCwvJwcGBPv/8c9FRauT27duV9h/m5ORUe5+1a9eSra0tHT58\nWCebPWvjk0/U71PXr4tOUncqVRnd/v5NKvl0adU3iIkhat5cvaKJAQgJCaFu3boJ/6BUb3l5RC1b\nEkVHi04iOVyEBqawsJAACNk8WB8//vgjdevWjZo3b04bN2587ptWQkICOTo66jBdzalU6i2KvXqp\nJ06G6O7dtXThQnMqK8vVHLx3j8jJichAPmgRET18+JBcXV1p48aNoqPUz9KlRB4e1GBHfLFn4pVl\nDBQZ2GVYBgwYgKSkJERFRWHJkiXo3bs3jh49KjrWMxUUAPHxmt83MQE2b1ZfKFyh0H2u+iore4CM\njMVo0WI5zMzsNW8QGQl4eAATJug8W105OTlh+fLlWLRokeFe/eTWLSAqSr3ckaWl6DSSw0VoYExM\nTJ45tmnTJmzatEmHaWrH1NQU48ePx+XLl9GnTx/4+/sjLi5O43YmJibCiz45GRg9Gjh4UHPM1RXY\nuhX46CMgIUH32eojK2sZrKxegKvrRI2xoqKfUVSUon4zNjWst4YpU6agRYsWWLZsmegodbNgAdC/\nP/CXv4hOIkmG9bedPVFVUSQlJSEpKUlAmtpxcXHB2rVr8dNPP2HIkCGi41Spd29g5Urg3XeBzEzN\n8QEDgLlzAbkcuHNH9/nqorAwGffufQp39xhU9U//1q0ZyFrYVP3DGRgzMzOsXbsWa9euNbyLRB87\nBsTFAZ98IjqJZHERGpjnzQgBw9pk6uXlBXt7zc1z+jAjBIBZs4A+fYD33lMv3P1nkZFA+/bAxImG\nccHwzMzFaNQoAHZ2fTXGHj+OR37+abi5rRKQTDv69euHoUOHIjQ0VHSUGiMiFEZHA+PHA507i44j\nWVyEBqaiCKsqCn0pkPrSl5/DxAT47DMgLU29tfDPzM2B2FggM7MQmzd/p/N8teXmtgLu7kqN7xMV\nIz09DE2bhsPSsqXug2nR6tWrceLECezevVt0lBrZtm0bvBITUbxihegoksZFaKCeVYRMuxo3Vu8P\nXLoUOHFCc/yFF4CIiP/DzJnv4sKFC7oPWAsyWWdYWrbW+P7du2tAVIZmzSIEpNIud3d3zJ49GyEh\nISguLhYd57lyc3Mxa9YszIyIgFXTpqLjSBoXoYExpk2jz6IvM8IKAwYA4eHA2LHq6xj+2bhx4zB+\n/HiMGDECubm5ug9YD6WlWcjKWgY3t5UwNbUWHUcr5s+fj9LSUqxZs0Z0lOeKjo6Gq6srZs6cKTqK\n5HERGiieEepWZKT6Ir5BQVWPx8TEwNbWFlOmTNFprvoyMbFCs2bz4Ow8VnQUrbG2tsbKlSuxbNky\nZGVliY5TpatXr+Ljjz+GUqmEubm56DiSx0VoYHhGKEbF/sC8vGOIjf1KY1wmk2Hr1q3YtWsXvvzy\nSwEJ68bc3BnNmi2Asb0VjBs3Dt26dcPixYtFR6nSvHnzMHjwYPj7+4uOwmBsf/slhGeEuvfCC0BQ\n0F1MmxZU5f5ALy8vfPzxx5g+fTp+/vlnAEBJSTqys1cjN/d7lJSk6zqyZJmYmCAmJgaxsbFITEwU\nHaeShIQE7Nq1CzExMaKjsN/xnNzA8IxQrOHDh0Mul2PcuHFITEyEjY1NpfFp06bh8OHDeO+993Di\nxAmUlWUhPX32k3ETE0tYWbWHtbUXZLLOT/23E7T9ufT+/c+Rnb0KRCUACM7O49GiRaRWn0Ofde/e\nHePHj0dISAiOHz+uFx8Uy8rKMGvWLMyYMQPt27cXHYf9jmeEBoZPnxBPqVSCiBAWFlbl+Pr16/Hw\n4UPMnz9f482XqARFRSl49Oi/yMpaiuvXRyMlpQt++skaly974fr10cjMjEROzk4UF18HULffQ3Hx\nL8jImIcOHQ6gS5dr6Nw5BY0avVWnxzJkH3zwAVJSUrBt2zbRUQAA//rXv/DgwQMoDHF9PiPGM0ID\nxZtGxbGxsUFcXBx69+6NAQMG4N1336007ujoiG+++Qb9+/fHa6+5o3Hj6h+zoiCLilIqfd/MzAFW\nVh6wtu4MmczryX+trNoCePbrXVp6B2Zm9jA3Vx+Wb2oqg61tr1r/rIauSZMmWLhwIebOnYt33nkH\ntra2wrI8ePAAixYtwgcffAAHBwdhOZgmLkIDw5tG9UOXLl0QHR2N6dOnw9fXF23btq003rt3b0RE\nRGDFihVQKuv+POXluSgoSEJBQeWl88zMHGFl9UKlgrSx6QkLi+YAAFvbPrCyegHJyW1hZ/cKHBxe\nhbPzWJiYSG9B55kzZ+LTTz/FsGHDNF4nXfr111/h6uqKwMBAYRlY1XjTqIHiGaF4f//73zFgwACM\nHTsWpaWlGuNjxoxpsKXXyssfo6AgCTk5e5Cb+z1ycw8gJ2c3SkszAAAmJubw8Pge7dvvhZ1dH9y7\ntx5paYMBqBomkB6ztLSEjY2N8H8fRISCgoIq/64wsXhGaGT0fSZVE4YwIwTUOTdu3AgfHx+sXbsW\ns2bNejJWWFiI0aNHY8iQPgB21fu5zM0bw8bGBzJZZ9jY9IC1tResrNrDzKzRc+9nbd0F1tZd4OIS\niPPnHVFcfBNWVu3qnceQbNy4EXl5efjuu+9gbS1u0YDS0lJ4e3tj5cqVWL58ubAcTBMXoQF6VlGI\n/sSrLYZShADQtGlT7N69Gx4eHpW+Hx4ejvLycsyfPx83b9a8CE1NZU9t6uzx5P8tLFrUKldx8TWU\nlmbAzu5lAEBBQSJMTExhYSGtpbwq9svFxMQILUEAsLCwwOrVqzFixAgEBgYK3UzLKuMiNDKGUiDG\npEePHpW+3rFjBzZv3ozjx4/D2trsGfcygUzWSeM0CpnMEyYm2vhnScjKWoGiIjlMTCxhZuaAdu22\nw9RU3MEiIvzjH/9Ap06d8N5774mOAgB48803MWjQIMyZMwfbt28XHYf9jovQAD1vRmgMRWjIP8et\nW7cwceJErFixAj169EBBwfk6b9asDyur9vDw2N9gj28ILl++jHXr1uHIkSN6tbUkJiYGXbp0QUJC\nAl599VXRcRi4CA2SsW8aNVTl5eUYP348/Pz8npxjaG3tja5ds2Bi8qyZIWsoc+fOxejRo+Hr66sx\nduvWLdy7d6/BM7i4uKBNmzaVvte+fXvMmDEDs2bNwvnz53mtUT3Ar4CRMdSZ1NMMdUa4atUqpKWl\n4cKFC08+lHABirF3714cPnwYqampVY5/+OGHWLduXYPnkMvlVa49GxkZia1bt2LTpk2YPn16g+dg\nz8enTxggnhHqn5MnTyIyMhJbtmxB45qcQc8aTGlpKcLCwjB37ly4ublVeZu1a9eCiBr8z7MWYLe3\nt8eyZcuwePFiPHjwoCF/HawGuAiNjCHOpP7M0GaE+fn5mDhxIqZNm4aBAweKjlMtohLcuvU+Skpu\nio7SID799FMUFhZizpw5oqM816RJk/DCCy9g6dKloqNIHhehATL2GaGhFWFoqAw9e85GdHS06Cg1\nYmJiiZKSDNy+HSI6itbdv38fS5cuxQcffCD8dInqmJqaQqlUYv369bh06ZLoOJLGRWiAnlcUhlQg\nxuDrr4G4ODMsXToFVlZWouPUmLv7J8jJ2Y/c3H2io2iVQqFAly5dMHasYVxouG/fvhg5ciRCQ0NF\nR5E0LkIjYmgzqWcxlJ8jLQ14/31gzRr1tQoNiZXVC2jadBZu3w4DkXEs+XXp0iX861//glKpNKit\nI6tWrcLp06exY8cO0VEki4vQABnDplGVSoXPP/8cly9fFh2lTkpKgPfeA4YOBcaPF52mbpo3X4jy\n8hzcu9fwR0/qQmhoKMaNG4cXX3xRdJRaadmyJebMmYOwsDAUFRWJjiNJXIRGZODAgXjnnXdEx6jW\nyZMn4evri7CwsCoPbzeEGWFkJJCTA2zYIDpJ3Zma2sHNLQqZmQqUlt4RHade4uPjcfbsWYPZT/tn\nc+fOhUqlgrI+lyphdcZFaICeVRRvvvmmxrXx9MmNGzfw9ttv45VXXsGgQYNw48YNDB8+XHSsWjt4\nEFi9GtiyBbCzE52mflxc/gpr667IzFwiOkqdFRcXPzldomlTw1xL1draGlFRUVixYgUyMzNFx5Ec\nLkLW4PLy8jBv3jx4eXmhvLwcFy9eRFRUFJycnKq8vT5v4r1/H5gwAViyBOhlFNe5NYG7ewwePPgC\n+fmJosPUyT//+U+Ul5dj9uzZoqPUy5gxY9CjRw8sWLBAdBTJMboiLC8vx/fffy86RoNJSUmBs7Mz\nTp06JTpKtSpOKO7YsSO2b9+Ob775Bnv27IGnp+cz71NeXo6dO3fC3d0dEREROHPmjN5sJiVSl6Cn\nJzBvnug02mNj8yKcneVITw8FoB+/65rKysrC8uXLER0dDZlMJjpOvSmVSmzZsgWnT58WHUVayMgk\nJiaSTCajQYMG0YULF0TH0ZqHDx9ScHAwmZub04ABA0gmk9HgwYPp4sWLoqNV6dSpU9S7d29ycHAg\npVJJJSUl1d7n0KFD5O3tTS4uLjRnzhwaMmQIWVpakru7O4WEhNCRI0eovLxcB+mrtm4dkYsLUXq6\nsAgNprQ0m86da0QPHmwRHaVWJk+eTC+//LLoGFoVFBREvr6+pFKpREeRDKMrQiKijIwMCgoKInNz\ncxo1ahTdvHlTdKQ6KyoqIoVCQXZ2duTr60unT58moso/o1wup8zMTMFJ1bKzs0kul5O5uTkFBQXV\nKFdycjL5+/uTlZUVKRQKysvLezJWUFBA8fHxJJfLycHBgZycnEgul1NcXFyl2+nCsWNEO3fq9Cl1\nKiXlE5LL36CCggLRUWokMTGRzM3N6aeffhIdRavu3r1Ljo6O9OWXX4qOIhlGWYQVzp49S/379ycb\nGxuKiIig3377TXSkWomPjycPDw9q1qwZxcbGVvkJMTExkfr160e2trakUCiosLBQQFKi4uJiioqK\nIkdHR/Lz86OzZ89We5/Hjx9TcHAwWVhY0KhRo+iXX3557u2LioooISGBgoODqUmTJmRjY0MBAQEU\nGxtLubm52vpRJKu4uJg8PT1p8eLFoqNUS6VSkZ+fHwUGBoqO0iBWr15NTZs2pZycHNFRJMGoi7BC\nfHw8tW3bltzc3J5ZKPrkeTOkqqhUKoqLi6M2bdqQu7s7xcbG6iip2p49e8jT05NatWpFcXFx1f5+\ny8rKSKlUkouLC3Xp0oUOHDhQ6+csLCyk7777juRyOTk6OlKjRo1ozpyT9O23RPn5df1J2M6dO0km\nk9GNGzdER3mu//73v+Tg4EDZ2dmiozSI0tJS8vLyogULFoiOIgmSKEIi9Sa2qKgocnBwoF69etHx\n48dFR9Lw6NGjSjOktLS0Wt2/4me0t7enV155hc6dO9cwQX937do1CggIIJlMRgqFgvJr0EBHjx6l\nF198kVxdXWnjxo1UWlpa7xzFxcW0d+9emj37ETVuTGRjQzRyJNHWrUQ8Uay9IUOG0KhRo0THeKbC\nwkJq27YtffDBB6KjNKiEhASytLSs9fsAqz3JFGEFfdx/WDFDcnZ2rvMM6Wnp6emV9h/euXNHS0nV\ncnNzKTg4mCwtLUkul9OtW7eqvc/Nmzdp1KhRZG5uTsHBwfTgwQOtZnpacjKRQkHUoQORmRmRnx+R\nUkmUkfH8+9naEr366h9f37tH1KhR5fGsrMrjZmbaTK4frly5QhYWFvTDDz+IjlKlFStWkIeHBxUX\nF4uO0uACAgJo2LBhomMYPckVYYWjR49Sz549af/rrxOtWkUk6h9VYiIVvPIKdWrfnlauXElFRUVa\nfOhE8vPzIzs7O1IoFPV+bJVKRbGxsdSiRQvq2rUrHTp0qNr7FBYWkkKhIBsbG3r99dcpJSWlXhlq\nq6IUO3cmMjVVl2JUFFFVuyNtbYlatSI6fFj9tVSLkIgoNDSUfHx8qKysTHSUSjIyMsjOzo6+/fZb\n0VF04urVq2RlZUX79+8XHcWoSbYIiYjKy8upNDaWqHlzIg8Povh43T35nTtEkyap30nHj6ey6qYr\ndVSx/7B169bk4eFBcXFxdXqckydPUq9evahx48Y13qQZGxtL7u7u1K5dO4rX5e/2GRITiebN+2Om\nOGAA0cmTf4zb2hJ99hlRxdH4Ui7CnJwcatasGW3YsEF0lEomTJhArz49bZeA8PBw6ty5c41OQWJ1\nI+kifKKgQD1NsLcneumlyu+O2lZYqJ6i2NgQvf46kY5mSPn5+RQVFUV2dna1Pv/w66+/JktLSwoM\nDKzRZtYLFy7QwIEDyd7enpRKpV5uwrp4Uf0yXLnyx/dsbYkePiR68UWi/furLsKWLYlat1b/cXc3\n3iIkItqwYQM5OzvT/fv3RUchIqLTp0+Tubk5nT9/XnQUncrNzaXmzZvTmjVrREcxWlyET0tPJ5LL\n1dvQ5HL1rE2bYmPV755t2+p29vmU9PR0ksvlZGFhQUFBQXT37t1q73Pnzp0anQ5x9+5dCgoKIktL\nSwoKCqKMBprlNhRbW6JHj4h27SLq3VvaM0Ii9RaTHj16UGhoqOgopFKpyNfXl6ZMmVLlmL4fCV5f\nn332GTk5OdG9e/dERzFKJkR6sn6VPklMBEJCgIsXgfBwYP58oD4XXU1OVj9eYiKwcCEQHAwIvnp2\nYmIiQkNDceXKFURERGDWrFmwtLSs02OVlZVh3bp1WLZsGTw9PRETE4NeBrgQp50dkJ4OODoCffsC\nkycDYWHA48d/jF+9CjRrpv76/n31/5eViUrc8I4fP46BAwdi586d8PDwEJZj7969WLhwIdLS0tCk\nSZNKY0OGDMHo0aMxceJEQem05/r163B3d4eFhUWl76tUKvTp0wetWrXC6NGjBaVTe/PNN2Frays0\ng7ZxET4LEfDVV0BEhPodcOVKYNSo2j1GTo56deb164GxY4GoKKBFi4bJWwdEhO3bt2POnDmQyWT4\n+OOP8dZbb9XqMfbv34/Q0FA8fvwY0dHRkMvler1o9vM8XYQHDwKTJqlLUMpFCKgvERQTE4OSkhJh\nGVq0aIGXX34Z//nPfzTG1q9fD4VCgbS0NDg6Ouo+nJaUlJTA29sbU6dORVhYmMZ4eHg49u7dK/ya\nhYcPH0bLli2FZtA6ofNRQ/DwIVFICJGFBdHQoertYUREeXlE779P5OZG1KIFUb9+RL8vf0ZE6rW4\n3NyIvL2JDh4UkbzGnt5/6O/vT8nJydXe5/r165XOIdT1cmcNoWLTaIWBA6W9afRpDx8+FPonPj6e\nLC0tKTU1VSNbWVkZ+fj4UFhYmIDfjPZERUVRmzZtqlziLjMzk+zt7WnLFsNaC9ZQcBHWVEqK+ijP\nigM/xowh+utf1QfaEKn3+bm6ElWsrXnokHqVZi2cMK4rt2/fJrlcTpaWlhQcHEyPnm6F3+Xm5lJE\nRARZW1vXaFk0xrRl6NCh9Pbbb1c5dujQIbK0tKSff/5Zx6m0o6Lotm3bVuX45MmTqX///ka/L1QU\nLsK6+PlnIkdHoj+vXTp1KtGcOWIyadGZM2eob9++5OzsTEqlksrKyp6cQ+jm5kbe3t50UM9nucz4\nXLt2jWQyGe3Zs6fK8eHDh9Nbb72l41TaERgY+MyraFQsLp6UlKTjVNLBRVgXcXHqM7P/7Isv1KdE\nGIGysjJav349NW7cmHr06EH9+/cnBwcHio6O1svTIZg0zJ8/nzp27FjlOXXXr19/blHqqzNnzjzz\nKhoVi4tPmDBB98EkxOguzCuUER13ZGZmhmnTpiEtLQ1Dhw7Fa6+9htTUVMydO7fOR5cyVl8LFixA\nbm4u1q5dqzHWtm1bhIWFISwsDKWlpQLS1R4RISQkBHK5HN27d9cY//bbb3Hp0iVER0cLSCcdfNRo\nXfz8M9CnD3D7tvpQwgpTpwIODsCqVeKyMWbkvvrqK/z9739HamoqmlUcwvu73NxcdOjQAUuWLMX0\n6VMFJay5b775BkFBQUhLS0PTpk0rjRUUFKBjx46YNm0aFixYICihNHAR1tXo0epzCzdtUp8TuGsX\n8Le/qc891KNTJBgzNkSEl19+GZ06dcKmTZs0xrduvYBFi7yRmGgKFxcBAWuooKAAnp6emDFjBubN\nm6cxvmLFCmzevBkpKSmQyWQCEkoHF2Fd5eWpT7bfuVP9ddu2wEcfAb6+YnMxJgE//fQTXnrpJZw4\ncUJj8QYi9YII3t7qz6n6avny5fjqq6+QnJyssbshMzMTnp6e+OKLLzBy5EhBCaWDi5AxZpACAwOR\nmpqKY8eOaSzikJSk/kx64gSgj4sc3bp1Cx07dsSWLVswbNgwjfEJEybg1q1b+OGHHwSkkx4uQsaY\nQcrIyEBgYAaCgnpixAjN4/4mTgTS0oBjxwB9W+xILpcjOzsb33//vcbYmTNn4Ofnh7Nnz8LHx0dA\nOunhImSMGaxVq4B//lN9/Nqfl7/MzgY8PdUrHL77rph8VTl27BgGDRqEc+fOwcvLq9IYEaFv377w\n9vaucv8naxhchIwxg1VSAnTtqj52bdkyzfGPPgKUSiA1VbMoRSAi9OnTB926dcOGDRs0xrdu3Yrp\n06dXubg4azhchIwxg7Zrl3o9/JQU9TFrT6soylGjgOXLxeR72tdff42ZM2ciLS0NjRs3rjSWn58P\nT09PhIaGIjw8XFBCaeIiZIwZvDffBGxsgO3bNcd27ADGjQNu3ABETrIqiq7ipP8/UygU2LZtGy5d\nusSLVugYFyFjzOBdvQp06aI+m+nVVzXHT58GXnpJ97metmTJEsTFxeHSpUsa1xv89ddf0alTJ2zb\ntg3vvPOOoITSxUXIGDMKs2cD+/cD588D5uai01R28+ZNdO7cGXFxcQgICNAYf/fdd/Ho0SPs27dP\nQDrGRcgYMwq//aY+SnTRImD6dNFpKhs7dixycnKwd+9ejbGjR49i8ODBuHDhAjp16iQgHeMiZIwZ\njc8+A+bOVZ8/6OoqOo3akSNH4O/vX2XRqVQq9OzZE3379q1yIXGmG1yEjDGjoVKpV5Tp3RvQh16p\nKDo/Pz+sWbNGY/zf//43wsPD8csvv8DJyUlAQgYAerYlnTHG6s7UFFizBigqEp1ELTY2Frdu3cLB\ngwc1xnJzczFv3jwsWbKES1AwnhEyxlgDqLgk1MKFCzFz5kyN8fnz52PXrl04d+4czPXt6B6J4d8+\nY4w1gF9//RU+Pj6YOlXzuoi//PILVq9ejd27d3MJ6gGeETLGmI6NGDECxcXF2LVrl+goDDwjZIwZ\nMTs79bUJKy7ycP8+0L498PixuEwJCQnYvXs3kpOTxYVglWheu4QxxoxIaipw5IjoFGrl5eWYM2cO\npk+fjvbt24uOw37HRcgYM2pLlgCLF4tOobZ582ZkZmZiyZIloqOwp3ARMsaM2vDhQF7eH5tHRXn8\n+DEWLVqEZcuWwdHRUWwYVgkfLMMYM1p2dkB6OnD8uPp6hbt3V95H+PnnwIoVtX9cT89JSE39sVb3\nKSoqQps2bXD48GE+UlTPcBEyxoxWRRE6OqoPmpk8GQgL+6MI09KACxdq/7iWlsdQUpJV6/uNGDEC\npqa8IU7fcBEyxozW00V48CAwaZK6BEUeNcr0D380YYxJwuDBQLt2olMwfcQzQsYYY5LGM0LGGGOS\nxkXIGGNM0rgIGWOMSRoXIWOMMUnjImSMMSZpXISMMcYkjYuQMcaYpHERMsYYkzQuQsYYY5LGRcgY\nY0zSuAgZY4xJGhchY4wxSeMiZIwxJmlchIwxxiTt/wHbQxRBY6Ho+AAAAABJRU5ErkJggg==\n",
"text/plain": [
"<rdkit.Chem.rdchem.Mol at 0x7f6a05e1ac20>"
]
},
"execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# ok ok, you are not blown off your feet. Let me show you something a little bit more complicated\n",
"m1 = Chem.MolFromSmiles('COc1ccc2c(c1)[nH]c(n2)[S@@](=O)Cc1ncc(c(c1C)OC)C')\n",
"m1"
]
},
{
"cell_type": "code",
"execution_count": 8,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAcIAAACWCAYAAABNcIgQAAAnwElEQVR4nO3deXxM5/4H8M9kss1k\nIos1EkvTEGuR0Kolau0ibZVGq8TVhlIiihuhLmO5KiquaNJWtOUm2ouoe4uqLdziWkIVkUSI2IJY\ngmadrPP9/TG/hDGRdTLPTOb7fr28JOc5Z+ZzvGS+eZ5zzvNIiIjAGGOMmSkL0QEYY4wxkbgQMsYY\nM2tcCBljjJk1LoSMMcbMGhdCxhhjZo0LIWOMMbPGhZAxxphZ40LIGGPMrHEhZIwxZta4EDLGGDNr\nXAgZY4yZNS6EjDHGzBoXQsYYY2aNCyFjjDGzxoWQMcaYWeNCyBhjzKxxIWSMsWpSqVRYsWIFioqK\nREdhesSFkDHGqqmkpAQRERFYuXKl6ChMjyRERKJDMMaYqdi0aRMCAgKQnJyMtm3bio7D9IALIWOM\n1dCgQYPg7OyMn376SXQUpgdcCBljrIaSkpLQo0cPbN++Ha+//rroOKyOuBAyxlgtzJw5E7t27cL5\n8+dhY2MjOg6rA75ZhjHGamHJkiXIy8tDeHi46CisjrhHyBhjtbRx40ZMmTIFycnJaNOmjeg4rJa4\nEDLGWC0REQYOHIjmzZtjy5YtouOwWuJCyBhjdZCYmIgePXrgl19+wauvvio6DqsFvkbIGGN10KVL\nF4QEBaH0+++BkhLRcVgtcI+QMcbqKjsb6NABmD1b84eZFC6EjDGmD//8JxAUBKSkAC1bik7DaoAL\nIWOM6QMRMGAA0LYtEBMjOg2rAS6EjDGmL2fOAL16AQcPAj4+otOwauJCyBhj+jR1KnDiBHDqFCCV\nik7DqoHvGmWMMX1atgy4eROIihKdhFUT9wgZY0zfvvsOmDMHuHgRaNpUdBpWBS6EjDGmb2o10KcP\n0K0b9wxNABdCxhirD6dPA717A0ePAi++KDoNqwRfI2SMsfrg7Q189hlQVCQ6CasC9wgZY4yZNe4R\nMsYYM2tcCBljjJk1LoSMMWYIeXmah+3d3ABXV6B/f+DkSdGpGABL0QEYY8wsBAQAVlZAaiogkwE7\ndwLDhwMJCYCLi+h0Zo17hIw1ZNwLMQ4XLwJ79wLffKMpggDw5pvAqFHA6tViszHuETZ0BQUFCAsL\nQ0FBAYYNGwYfngjYvHAvxDgkJACdOwMKhfb23r2BzZvFZGLluEfYgO3atQtdunTB2rVrceHCBQwe\nPBgjR45Eamqq6GjMELgXYvz46TWjwIWwAUpKSsKgQYPw7rvvYty4cUhNTcW2bduQlpYGhUKBjh07\nYvz48bhz547oqHqlUADDhj3+PjMTcHQUFke8ynohCQlCIp0+fVrI+wrXtSuQlATk5mpvP3FC08aE\n4kLYgOTk5GDGjBno0aMH3NzckJqaikWLFkH2/72B1q1bIyYmBseOHcPVq1fh4eGBRYsWQaVSCU6u\nPxcvAocPi05h5AT1QlJSUvDSSy/h2LFjQt5fqA4dgKFDgU8+Acp+3n75Bdi2DZg5U2w2xoWwISAi\nxMTEoEOHDti/fz92796NmJgYuLm5Vbj/iy++iMOHD2PDhg3YuHEj2rdvj3Xr1kGtVhs4uf4tXAgs\nWCA6hZEwsl5Ihw4d8PHHH+Pjjz9GcXGxwd9fuPXrATs7wMNDc+NSaKimGLZsKToZI2bSzp8/TwMG\nDCB7e3sKDw+noqKiGh1fWFhI4eHh5OjoSD179qRDhw7VU9L6Z2dH9PAhkZcX0d69RPfvEzk4iE4l\nmJ8f0bhxRPn5mu937iRq3Jjo1i0hcR4+fEhNmzal8PBwIe/PWEW4R2iisrOzMWPGDHh5eaF169a4\ncOECZsyYASsrqxq9jrW1NWbMmIG0tDQMHjwYw4YNw5tvvonLly/XU/L6JZEAS5Zwr7CckfVCnJyc\nsGzZMixcuBAZGRlCMjD2NC6EJoaeGAY9cOAA9u7di5iYGLi6ulZ63J49eyod+nR2dkZoaCgSEhIg\nk8nQqVMnTJ48Gffv39f3KejNjRvAunW624cPB6RSYMcOw2cyOgoFsHYtcOuW5s///qe5WUaggIAA\ndOzYEfPmzROag7FyorukrPoSEhLIx8eHGjVqVKNh0Js3b5KjoyN169aN9u/fX61jjh8/Ti+//DI5\nOTlRaGgoFRQU1CW63ty5QxQRQdS3L5FEQtSjh2Y4lEgzNProkebruDiiNm14aNRY/f777ySVSk16\nKJ41HNwjNAFZWVmYMWMGvL290aZNG6SkpNRoGNTV1RXp6ekYMWIE3nzzTQwePBhnzpyp9JjevXvj\n6NGjiIqKwtq1a9G1a1ds3boVJOCOw4wMYM0aoGdPoEULzfPHfn7A9evAH38ATk66xwweDLi7Gzwq\nqyZvb298+OGHCAwMRElJieg4zNyJrsTs2dRqNUVHR1OLFi3ohRde0Mtvz+np6fTxxx+TpaUl+fn5\n0bVr16o8Jj8/n0JDQ8nBwYF69+5NR48erXOOqty9SxQerun5WVgQdexIFBpKdPVqvb+1aYqPJ/L2\nJiosFJ2k2h48eECNGzemyMhI0VHqz08/ESmVolOwKnAhNFInT56kXr16UePGjSkqKoqKi4v1+vqn\nTp0iHx8fksvlFBISQllZWVUek5mZSUFBQWRlZUV+fn50Vc9VKT+/mLZtI3r3XSKZjKhlS6IZM4iO\nHydSq/X6Vg2LWk300kuafywT89VXX5GTkxPdu3dPdBT9y8sjcnPT/AbHjBoXQiOTmZlJ/v7+ZGlp\nSUFBQZSZmVmv77djxw7y8PCgJk2aUHh4OJWUlFR5zIULF8jPz49kMlm1i+izZGdnU3R0NPn6+pKd\nnR116XKXQkKIEhNr/ZLmZ9MmImfnxxdLTUhpaSn16tWLAgICREfRv+XLNReqVSrRSVgVuBAaidLS\nUgoPDydnZ2d66aWX6NSpUwZ776KiIoqKiqKmTZtSx44daefOndU6Li4ujrp3716jIlr2fr/++itN\nmDCBHB0dydHRkSZMmEC7d++u8XOQNRESQrR0ab29vBgqFVHbtkRffFFx++rVRN99Z9BINXXs2DGS\nSqV0/Phx0VH0JyODyN6e6McfRSdh1cCF0AicOHGCevbsSU2bNqXo6GgqLS0VkuPhw4cUEhJCNjY2\nNGTIEDp37lyVx5SWllJsbCy1adOm0iJaUFBAsbGx5OvrSzKZjJo1a0ZBQUF05MgRg51vfDyRra3m\nYfsGIzSU6PnnK742eOOGZox52zbD56qhv/zlL+Tt7V3tX6aM3tSpRH368Ji+ieBCKND9+/fJ39+f\nrKysKCgoiB4aydDW9evXyd/fn6RSKfn7+1NGRkaVx+Tl5VFoaCjZ29uXF9HCwkLasWMH+fv7k6Oj\nIzVp0qS8+In6wAsLI2rWTNjEKnqlfphJ5OREFB1d8Q4TJhD5+Bg2VC3dvXuXHB0dKSoqSnSUuktM\nJLK0JDp2THQSVk1cCAUoKSkpHwbt06cP/fHHH6IjVejEiRPUt29fsrOzo5CQEMrJyanymGvXrtGY\nMWPIxsaGWrRoQTKZjEaOHElbtmyhvLw8A6SunFpNNGIE0YABRKbe+bhxI4gyf3yPqKIe9e+/az6M\njfT/VkXWrFlDzs7OdP/+fdFR6sbXl+idd0SnYDXAhVCALVu2kJOTE0VGRhr9UJBarabY2Fhyd3cn\nV1dXioqKqlbmKVOmUL9+/Sg7O9sAKWvm4UPNZbWFC0Unqb38/PN0+rQl5eY+o9fxyitE/v6GDVVH\nJSUl1K1bN5oyZYroKLW3fz+RjQ1RWproJKwGuBAK8P7779MME7vVvWxybgcHB/Ly8qL//ve/le6v\nVCrJ19fXMOEq8awbWsuuF+7bZ9g8+pKa+galpY2quHH7diK5nOjmTcOG0oMjR46QVCql+Ph40VFq\nrrSUqFs3k3yMxdzxzDICWFpaio5QY09Ozj106FC8+uqrGDp0KBITEyvcXyqVCp8xZNMmzWw0OTm6\nbS++qJmce9w44PZtw2eri+zsfcjOPgBX1y902ohKcc1xNQq/WaiZZNvE9OvXD++//z6mTZtmesuC\nbdwIpKcDSqXoJKyGuBAKYGlpidLSUp3txcXFuHLlilF/ADRu3BihoaGIj48HEaFnz564cuWKzn7P\nOkdDGjkSaNQIGDu24rVo//pX4OWXNe2Co1YbUQnS02eiWbNpsLHRnUMuM3Mtsh0vwmrcNAHp9GPV\nqlVITU1FdHS06CjVVlBQgF9//hlF8+ZVPOcfM2pcCAV4Vm/p+vXreP7555GdnS0gVc10794dcXFx\n+O233+BewaSelpaWwnuENjbAli2aFesjI3XbJRJgwwbg2jVg6VKDx6uVP//chuLiDLRo8ZlOW2lp\nFm7fXoyWLRfDwkIhIJ1+NG/eHAsWLMDcuXPx6NEj0XGqJSwsDDMSE4GgINFRWC1wIRTgWUWibMhU\ndE+qJno/Y0kfqVRqFOfx/PPAd98Bs2drFmZ/mpOTphiGhQHHj98wfMAacnQcifbt42Bp2Vin7c6d\nFbCyaoHGjT8SkEy/ZsyYgebNm0NpAsOMGRkZWLFiBT7//HNYW1uLjsNqgQuhAM8aNpRKpQAgvCel\nD8bQIyzz7rvApEmaIdCsLN32V14BFi/+F0aP7ovMzEyD56sJicQKcrmXzvaiouu4d281WrUKh0Qi\nFZBMvywtLREeHo5vvvkGZ8+eFR2nUosWLUL37t3h5+cnOgqrJS6EAjxraLSsR2gsBaQujOFmmSf9\n4x+AoyMwcWLF7bNmjYG3tzf8/PyMoidbU7dvL4C9/UDY2w8SHUVvBg0ahJEjRyIwMFDI8l/Vcf78\neaxfvx6rVq0SHYXVARdCAZ7VIzTFodFnMYabZZ5Udr1w/37gq6902yUSCTZs2ICrV69i2bJlhg9Y\nR02aTISbW8P7MF61ahXOnTuHH374QXSUCoWEhGD06NF48cUXRUdhdcCFUIBn9ZZ4aLR+eXgAX34J\nrFxZgvPnL+q0Ozk5YfPmzVi+fDni4uIEJKw9hcIHtrYdRcfQOzc3N8yfPx/BwcHIqmhcW6B9+/bh\n0KFDWLFihegorI64EApQ1c0yxlZAasPYhkbLjB8PvPHG3zB69Ajk5ubqtPfu3RtKpRLjxo1DRkZG\n+faCgksgKjZkVPb/Zs2aBScnJyxevFh0lHKlpaUIDg7GjBkz4ObmJjoOqyMuhAJUdbOMMQ0p1pax\nDY0+afXqxZDJZPjoo4rvrgwJCcFLL72EsWPHlp9DcnIX/PGHNRISWiI1dSiuX5+Me/fWIDs7DoWF\nus9R6lNm5nokJXVEYuLzSEx0x+3bi+r1/YyNtbU1IiIiEBERgYSEBNFxAAD//Oc/ce/ePcybN090\nFKYHpjfFSQNgDjfLGOPQaBkbGxvExsbC29sbX3/9NaZOnarVXna90MvLC8uXL8ff/vY3SCSWICpG\ncXEGioszdF5TKnWCjY07ZLJOsLXtDBsbd9jadoKtbYc63cVZWJiKW7fmolOnM7CycoVaXQCV6nyt\nX89UDRkyBG+99RYCAwNx6NAhSCQSYVny8vKwcOFCKJVK2NvbC8vB9IcLoQBVFUJj7UnVhLEOjZbx\n8PDAt99+i/Hjx6N3797w8tJ+JMHZ2RkbN27EkCFD8PLLL8PZufJiVlr6CPn5p5Gff1pru0RiDWtr\nN9jadoJM1vmJvzvAwsKuypzFxXcgldrD0rI5AMDCwhZ2dr1qeLYNw8qVK9G5c2dMnz4dL7zwQvn2\nkpIS5Dw1j55KpUJBQYHWtuzsbK2fLbVarXPdsbCwEPn5+VrbcnNzUVz8eFg8JycHdnZ2CAgIqPM5\nMePAhVCAyoZGJRKJUReQ6jLmodEyo0ePxoEDB/Dee+/h999/h4ODg1Z7//79oVQqMXbsWPz6a+2u\nIhAVobDwCgoLryAr6xetNisrF8hknWFtrd2TfHLqNDu7l2Fj8zwSE5+DQvEKGjUaCmfn9yGRmN+D\n28899xw6duyIAwcO4MQTsyNYWlrq9MxkMhlsbW21tjVq1Kj88kPZcU/PimRtbQ07O+1fUOzs7LQe\nlE9LSyu/m7Vnz551Pi8mHhdCASobNjT2nlR1GfPQ6JPWrFmDPn36YNKkSYiNjdVpDwkJwbZt21Ba\nmgoLPV9Rf3KYVSp1hFzeHTJZNzg6vgmFwgcSiRUkEku0a7cPKlUicnMP4/79b5CZ+S08PQ/B3C7x\nb968GTdu3MDly5fh6OgoNMv9+/cxefJknDx5Uqu4MtPEhVCAyoqdsUxNVlemch62trbl1wvXrl2L\nKVOmaLXv3r0bSUlJkEoVFU7cXVMSiRQ2Np6ws/OGXK75I5N1hlRa+UTNMlkXyGRd0LjxRzh71hGF\nhdcqnHS7ocrPz8ecOXOwYMEC4UUQAEJDQ+Hp6YnvvvsOkydPFh2H1REXQgEqGzY0lZ5UVUzpPDw8\nPLBmzRpcvKj9bOHdu3cREBCAxYsXw9IyAsU1fHrCwkIBubxbecGTy71ha9uuRsOahYVpKC6+BYXC\nBwCQn38KEokFrKya1yyMiYuIiIBcLte5sUmUZs2aYcmSJfjss88watQoNGnSRHQkVgdcCAWorEiY\nUgGpjKmdx4QJE3S2TZ48GZ07d0ZwcDCSkr6u9Piyu0Tlcu/y3p6VVUs9JCNkZCxDQYE/JBJrSKWN\n4O7+U7VutGko7t69i2XLliE6OhpWVlai45SbOnUq1q9fj/nz5yMqKkp0HFYHXAgFqGzY0FSGFKti\n6uexbt06HDlyBOfOnYOFhQUkEs2PikRiDZmsK2SyTjUa2qwtGxsPtGu3t15e21QsWbIEPXr0wDvv\nvFOt/YuLiyucLKGiJZ2eviMU0KwtqFKptLYpFAqdlVakUikiIyMxYMAABAQE8DRrJowLoQDcIzRu\nFy9exKxZs7Bu3bryWUNatlwCKys3yOXdIJU6ig1oRpKSkvDtt98iPj6+wvaZM2ciPDxcr+9pY2MD\nuVyutc3T0xPHjx/X2bdv374YM2YMpk2bhvj4eFjo+44qZhBcCAWo6mYZUy0gTzLVQlhcXIyxY8fi\n7bffxgcffFC+3dl5rMBU5mvu3LkYPXo0evToUWH77NmzMW7cOK1tVlZWUCh0FyZ2qmDleIVCUefh\n1rCwMHh6emLDhg38bKGJ4kIoQFU3y5jykGKZsqFRIhI6C0hNLV26FJmZmThw4IDoKNVCVNog1h+s\nyP79+3Hw4EGdm5ie5ObmJnyuz+bNm2PhwoUICQnBiBEj0Lix7qLJzLhxP14AcxkaBUxrlpxDhw4h\nNDQUP/zwg87D9cbowYNoXL78uugY9UKtVpvUpNZBQUFwdXWFUqkUHYXVAhdCAcxhaNTUJhDPywOW\nLFmNwMBA9OvXT3ScamnU6DXk5Z3Cw4fGuVZfXcTExODu3bsmM6m1paUlIiMjERUVhTNnzoiOw2qI\nC6EA5jA0amoTiM+aBWRlbcbnny8XHaXarKyaw8VlIW7e/CtKS41rrb66yMvLw/z5801uUuv+/fvj\n3XffRWBgIEgfsy8wg+FCKAAPjRqXLVuAH34ANm60ha2tjeg4NdKs2XRYWjZHRsYS0VH0ZtWqVXB2\ndsakSZNER6mx1atXIzExERs3bhQdhdUAF0IBzGWKNcD4e4Q3bgBTpgArVgAdTXCBd4nEEq1bR+Le\nvQioVMaxVl9dZGRkYOXKlVixYoVJzuHZokULzJ8/H3PmzMGff/4pOg6rJi6EAjSkKdaSkpJw48YN\nne2mMDSqVgMBAUC/fsC0aaLT1J5C0R+OjiNx40YgANMekluwYAH69OmDN954Q3SUWvv000/h7OyM\nxYsXi47CqokLoQANYWg0Ozsbs2bNgpeXF3bs2KHTbgpDo2vWAOfPA99/D5jQEx4VcnMLQ37+GTx8\nuEV0lFr7448/EBMTg5UrV4qOUifW1taIiIhAZGQkzp07JzoOqwYuhAJUNvwZERGBt956y8CJqq+0\ntBRr1qxB27ZtcfLkScTHxyMwMFBnP2MfGj13Dpg3D4iKApo1E52m7qyt3eDi8hlu3pyJ0tJs0XFq\nJTg4GP7+/lqL7pqqwYMH4+233+YbZ0wEF0IBKuv19erVC61atTJwouo5duwYevXqheXLlyM8PBxH\njhxB9+7dK9zXmIdGVSrggw+A8eOBt98WnUZ/mjefDanUARkZfxcdpcZ2796N+Ph4LF26VHQUvVm9\nejXOnDmDTZs2iY7CqsCFUABTe1bw7t27GD9+PF555RX0798fKSkpGD9+fKUzxiQlJcHNzQ3ffvst\nUlJSDJi2an/7G1BaCqxeLTqJfkkk1mjV6kvcu7cGBQUXRMeptpKSEsyePRvBwcFo2VIfK3YYh1at\nWmHevHmYPXs2srIazuMtDREXQgMrLCzE1q1b0bZtW6xfvx5qtVp0pGcqKirCihUr0KFDB1y9ehWn\nTp3CmjVrKl0Y9cGDB5g8eTKGDBkCHx8fHDx4EJ07d0b79u0RHByMw4cPC71uGB8PREZqrgvaNcCV\njBo1Goa0tA8xcaLpzHDy/fffIzc3F3PmzBEdRe+Cg4Ph4OCAv//d9HrpZoWYwfz666/Url078vDw\noLlz51LLli3phRdeoH379omOpmPv3r3k6elJrVq1otjYWFKr1ZXuX1hYSEqlkuzs7Oi1116jS5cu\nlbc9ePCAYmNjyd/fn+zt7Ukul5Ovry9FRUXRnTt36vtUtBQXEx08aNC3NLi0tDSytbWlrVu3io5S\npaysLGrWrBmtX79edJR6s3fvXrK0tKSEhATRUdgzcCE0gMTERBo0aBA1atSIwsPDqbi4mIg0xSM8\nPJwcHBxo4MCBdPr0acFJia5fv06+vr5kbW1NSqWScnNzqzxmz5495OnpSW3btqUdO3ZUuq9KpaL9\n+/dTUFAQubi4kFQqpb59+1JoaCglJyfr6zTMnlKpJDc3N8rJyREdpVKfffYZeXt7U2lpqego9ert\nt9+mwYMHi47BnoELYT3Kzs6moKAgsra2Jn9/f7p9+3aF+2VmZlJQUBBZWVmRn58fXb161bBBiaig\noICUSiXJ5XIaNmwYpaSkVHnMtWvXyNfXl2xtbUmpVFJeXl6N3rOoqIj2799PgYGB1Lp1a5JIJDRi\nhJIWLyY6e7a2Z8KIiPLz88nd3Z3mzZsnOsozXbt2jWQyGR1s6F100vyCKZfLKTY2VnQUVgEuhPVA\nrVZTdHR0+dDn4cOHq3VcSkoK+fn5kVwup5CQEMrKyqrnpBq7du2idu3aUevWravs0RFpF01fX1+6\nfPmyXnKcPn2a/vGPBOrWjQggeu45ok8/Jfrvf4lKSvTyFmbl559/Jmtr62r9UiPC2LFjafjw4aJj\nGMyiRYtMopdujrgQ6tn58+dpwIAB1LhxY4qKiiofBq2JuLg46t69OzVp0kRrKFXfrly5Qr6+vmRj\nY1PtHt2uXbvIw8OD3N3dq1U0a+v+faLoaCJfXyIbGyK5XPN1dDTRo0fPPs7OjmjoUO3XcXDQbs/I\n0G6XSvWd3ngMHz6chj75D2IkTp48SdbW1nThwgXRUQxGpVIZfS/dXHEh1JOsrCwKCgoiGxsbCgoK\noszMzDq9XmlpKUVHR5OLiwt16NBBr0MqKpWKlEolyWQyeu211+jixYtVHlNWNBUKBYWHh1NhYaHe\n8lQlL49oxw4if38iR0dN4erblyg0lOiJe3KISFPoWrcmOnRI8725F8LLly+Tra0t/ec//xEdpZxa\nraaXX36ZPvnkE9FRDG779u1G3Us3V1wI9eGnnyi5Xz/q0b273q935ObmUmhoKNnb29PgwYPpzJkz\ndXq92NhYcnd3pzZt2lSrR/dk0fT396f09PQ6vX9dqVREO3cSTZxI1KwZkYUF0ahRj9vt7Ii++47I\nx0fzvbkXQiKi+fPnU+vWrat145Mh/Pvf/yYHBwe6d++e6ChCGGsv3ZxJiHj+n1pLSQGCgjQPpymV\nwPTpgJVVvbzVrVu3sGTJEqxfvx5jxozBihUr4OLiUu3jr1+/jtmzZ2P79u2YNm0aFi9eXOUq7Fu3\nbsXcuXNha2uLiIgIDBo0qK6noVdqNXD8OHDnDjBqlGabQgGkpwNDhgDLlwNeXoCHB1C2EIBCATg5\nAWULG6jVwO3bgAnNb1BjKpUKnTp1wvjx44VPBF1YWIhOnTph0qRJmDt3rlZbcnIy8vPz0bNnT0Hp\n9EetVuP48ePo27evTltKSgq6desGPz8/uLm5lW8vKipCXl6e1r55eXkoKirS2vbnn39qTdtWUlKC\nnJwcrX1UKhUKCgq0tuXk5GhN5OHk5IS0tLSan1wDZCk6gEl68ACYORPYvBn45BPN387O9fqWrq6u\niIqKwuTJkzF79mx4eHhg+vTpmD9/frUWL01PT4dKpcKFCxfg4eFR6b4XLlxAUFBQ+ZRXU6dOhVU9\nFfi6sLAAKvicgUQCLFkCLFgA7Nql237qFNCihebrzMzHXzdUMpkMYWFhGDt2LHx8fPDcc8+Vt1X0\n4Zufn4/CwkKtbVlZWVqTP5SWliI7W3tO04KCAqhUKq1tT3/4Xrp0CSqVCkFBQTo5Y2JisHPnTpw9\ne9Yo/7/VxI8//ohZs2bhypUrOj+frq6ucHR0xO3bt7WKnLW1NeyemuWhWbNmsLa21trm6OioNauT\nVCpFo0aNtPaxtbWFTCbT2mZvb18+9SEAra/NHfcIa0KtBiIiNJ+ynp6aKUq8vIREiYuLw6effopH\njx5BqVQiICCgzuu35ebmYv78+Vi7di3ee+89hIaGmtyUVwoFcPMm4OgI9OkDTJyoWX3+yR7h5cu6\nhbAh9wjLTJ8+HZGRkVXuJ5fLYWOjvUCxg4MDLCweT0RV2w/fO3fu4NKlS0hNTdUpECqVCp07d8bH\nH3+s01s0JXl5eWjfvj0WLlyIyZMn67TPnTsXBw4cQHx8vNa/KRNI6MCsKTlxgqhnT82Fqehooipm\nWjGEoqIiioqKombNmlGnTp1o165dtX6t6OhocnV1pS5dutBvv/2mx5SGZWf3+K7SuDiiNm34GuGT\nHj58qPXH0LfyFxUVUceOHenTTz+tsP3f//43yeVyunbtmkFz6ZNSqaQuXbpQSQXP/Fy9epVsbW1N\n+mesIeJCWJV79zS3K1pZEQUFVX7vviAPHz6kkJAQsrW1pSFDhtC5c+eqfWxiYiINHDhQZ9YbU/Vk\nISQiGjiQC6GxiYuLI0tLy2f+P33jjTfIz8/PwKn048aNGySTyZ75S+mYMWPorbfeMnAqVpWGXQir\n+tTLzSX65BMiV1eili2J+vUjio9/3P7DD0QtWhB5exMdP2643LV0/fp18vf3J6lUSv7+/pTx5Lk/\npexxj7JZbyrblzF98/Pzo379+lU4h21qairZ2NjQ7t27BSSrmw8//JCGDRtWYdvRo0f50QkjZd6F\n8L33iMaNI8rP13y/YwdRkyZEZVOhLVhA9M03RCY2D+KJEyeob9++ZGdnR0qlkvLLzo8ez3rj4uJC\nvXr1opMnTwpMysxVeno6KRQK2rx5c4Xt8+bNo3bt2lFBQYGBk9Xe77///syebtmzk4GBgQKSsaqY\nbyFMSdE8nf30NZLJk4mCgw2XsZ6o1WqKjY2l5557jtzc3CgqKorOnj1LPj4+1KRJE4qOjm7wEx0z\n4/b5558/c8qxvLw8atu2LX3xxRcCktXOK6+8Qh999FGFbT/99BM5OzvTgwcPDJyKVUfDL4Rubpo7\nJtq0IWrV6nEhjI3VTE/ytA0biF591YAh61dOTg4tXLiQ5HI5ubi40AcffEC3bt0SHYsxKiwsJE9P\nz2dOOfavf22iIUOiyRRG7Xfu3El2dnYV/mwVFBSQu7u7SRV1c9OwH5+o7F75rVuBNWuA//1P+5gN\nG4AtW4A9ewyftx5lZGTAxsYGzvX8vCNjNbF//374+voiISEBnp6eOu2vvw44OGge1TVWxcXF6Nq1\nK8aMGQOlUndB5NWrV+Orr75CcnKyzjOBzDiY70MsXbsCSUlAbq729hMnNG0NjIuLCxdBZnSGDh2K\n4cOHY/r06RW2f/kl8PPPwMGDhs1VE+vWrUN+fj7mzJmj0/bgwQMsXboUy5Yt4yJoxMy3RwgAo0cD\nNjbAunWATAb88gswYQKQkACY2IPkjJmqtLQ0dO36AnbsOIkhQzrrtIeEaH40z56ttxkMay0rKwse\nHh5YsWIFPvroI532mTNn4tSpUzhy5IjWbDDMuJhvjxAA1q8H7Ow0k1G6ugKhoZqfOC6CjBnM888/\nD6XyFqZO7YynZnYDoJnGNy9P0zs0Np9//jlat26NCRMm6LSlpqbi66+/RlhYGBdBI9ewe4SMMZNQ\nVKS5IvHBB5rC97QtW4BJk4ALFzS/sxqDtLQ0dOrUCXv27MHAgQN12keNGgWpVIrY2FgB6VhNcCFk\njBmFvXuBd94BEhMBd3fd9sGDNVc2fvzR8Nkq8v777yMnJwe7KpjZ/ciRIxg2bBiSk5O1JjlnxokL\nIWPMaLz1lmb1kO3bddsuXAC6d9fc0F1BB8ygjh49ioEDByIhIQEdOnTQaiMi9O7dG/3790dYWJig\nhKwmeB0OxpjRCA8HOnfWLJ81fLh2W8eOwNy5mlXQRCIi/PWvf0VAQIBOEQSATZs24cqVK9i7d6+A\ndKw2uEfIGDMqixYBP/ygGSK1tRWdRldsbCwmTZqEy5cvo2nTplpt+fn58PT0RHBwcIVrLjLjZN53\njTLGjE5IiGbpz1WrRCfRVVhYiLlz5yIkJESnCALAl19+Cblcjk8++URAOlZb3CNkjBmd7duBMWOA\n5GSgbVvRaR4LCwtDZGQkUlJSYPtUd/XOnTto3749YmJiMGLECDEBWa1wIWSMGSVfX818F9u2iU6i\nkZmZiXbt2iEiIgLjxo3TaZ86dSouXbqEuLg4AelYXXAhZIwZpZQUoFcv4Px54+gVTp8+HfHx8YiP\nj9d5QD4xMRFeXl6Ij49Hjx49BCVktcWFkDFmtP78E3B0FJ0CSE5ORrdu3XDgwAH4+PjotA8fPhzO\nzs7YuHGjgHSsrvjxCcaY0TKGIggAu3btwquvvlphEdy3bx9+++03XLp0SUAypg/cI2SMsWooKCjQ\nuUGmtLQUXl5e8PX1xbJlywQlY3XFj08wxlg1PF0EASA6Ohr37t3DvHnzBCRi+sKFkDFmEhQKYNiw\nx99nZoodOs3Ly8OCBQuwaNEiKBQKcUFYnXEhZIyZjIsXgcOHRafQWLlyJZydnTFx4kTRUVgdcSFk\njJmMhQuBBQtEpwDS09PxxRdf4IsvvoBUKhUdh9UR3yzDGDMJCgWQng4MGQIsXw54eWnW1P7zT037\nnj1ATs7j/UtKtL8HgPx86Cz+++jRXK3vCwsLkZ+fr7UtJycHJSUl5d/fu3cPFhYWOHjwYF1PixkB\nLoSMMZOgUAA3bwJHjwJLlmhWqHiyEA4bBqSlPd7f0hKwt9d+DblcM1vNk5yd3weRuvx7a2tr2NnZ\nae1jb28PS8vHT5s1adIE06ZNg0wm08epMcG4EDLGTEJZIXR0BPr0ASZOBGbNelwIGastfqCeMWZy\nli4FAgJEp2ANBd8swxgzOYMHA+7uolOwhoKHRhljjJk17hEyxhgza1wIGWOMmTUuhIwxxswaF0LG\nGGNmjQshY4wxs8aFkDHGmFnjQsgYY8yscSFkjDFm1rgQMsYYM2tcCBljjJk1LoSMMcbMGhdCxhhj\nZo0LIWOMMbP2f90UnnsNSC8EAAAAAElFTkSuQmCC\n",
"text/plain": [
"<rdkit.Chem.rdchem.Mol at 0x7f6a05e1a830>"
]
},
"execution_count": 8,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# now we remove a methyl group on the left to show you similar\n",
"m2 = Chem.MolFromSmiles('Oc1ccc2c(c1)[nH]c(n2)[S@@](=O)Cc1ncc(c(c1C)OC)C')\n",
"m2"
]
},
{
"cell_type": "code",
"execution_count": 9,
"metadata": {
"collapsed": true
},
"outputs": [],
"source": [
"# Let us generate fingerprints and calculate the similarity (Jaccard) between the two\n",
"fp1 = AllChem.GetMorganFingerprint(m1, 2)\n",
"fp2 = AllChem.GetMorganFingerprint(m2, 2)\n",
"\n"
]
},
{
"cell_type": "code",
"execution_count": 10,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"1.0\n",
"0.885496183206\n",
"0.0547945205479\n"
]
}
],
"source": [
"print DataStructs.DiceSimilarity(fp1, fp1) # identical\n",
"print DataStructs.DiceSimilarity(fp1, fp2) # very similar\n",
"print DataStructs.DiceSimilarity(fp1, AllChem.GetMorganFingerprint(Chem.MolFromSmiles('CC=O'), 2)) # dissimilar"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {
"collapsed": true
},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 2",
"language": "python",
"name": "python2"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 2
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython2",
"version": "2.7.6"
}
},
"nbformat": 4,
"nbformat_minor": 2
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment