{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "import numpy as np\n", "import json" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [], "source": [ "# Parse the interactions file into ddi_json. The encoding is pinned to UTF-8\n", "# (the JSON interchange encoding) so the read does not depend on the OS locale.\n", "with open('data/interactions.json', encoding='utf-8') as f:\n", "    ddi_json = json.load(f)" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
| \n", " | Unnamed: 0 | \n", "name | \n", "state | \n", "level4 | \n", "level3 | \n", "level2 | \n", "level1 | \n", "Molecular Weight | \n", "logP | \n", "Water Solubility | \n", "... | \n", "Rotatable Bond Count | \n", "Polar Surface Area (PSA) | \n", "pKa (strongest basic) | \n", "Ghose Filter | \n", "Monoisotopic Weight | \n", "MDDR-Like Rule | \n", "Polarizability | \n", "H Bond Acceptor Count | \n", "Physiological Charge | \n", "Rule of Five | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "5 | \n", "Bivalirudin | \n", "solid | \n", "B01AE | \n", "B01A | \n", "B01 | \n", "B | \n", "2180.2853 | \n", "-14.00 | \n", "0.04640 | \n", "... | \n", "66.0 | \n", "901.57 | \n", "11.88 | \n", "0.0 | \n", "2178.985813 | \n", "1.0 | \n", "218.54 | \n", "37.0 | \n", "-4.0 | \n", "0.0 | \n", "
| 1 | \n", "6 | \n", "Leuprolide | \n", "solid | \n", "L02AE | \n", "L02A | \n", "L02 | \n", "L | \n", "1209.3983 | \n", "-2.40 | \n", "0.03380 | \n", "... | \n", "32.0 | \n", "429.04 | \n", "11.92 | \n", "0.0 | \n", "1208.645462 | \n", "1.0 | \n", "125.24 | \n", "16.0 | \n", "1.0 | \n", "0.0 | \n", "
| 2 | \n", "13 | \n", "Goserelin | \n", "solid | \n", "L02AE | \n", "L02A | \n", "L02 | \n", "L | \n", "1269.4105 | \n", "-5.10 | \n", "0.02830 | \n", "... | \n", "33.0 | \n", "495.89 | \n", "10.91 | \n", "0.0 | \n", "1268.641439 | \n", "1.0 | \n", "130.74 | \n", "18.0 | \n", "1.0 | \n", "0.0 | \n", "
| 3 | \n", "25 | \n", "Gramicidin D | \n", "liquid | \n", "R02AB | \n", "R02A | \n", "R02 | \n", "R | \n", "1811.2530 | \n", "5.96 | \n", "0.00390 | \n", "... | \n", "50.0 | \n", "519.89 | \n", "NaN | \n", "0.0 | \n", "1810.033419 | \n", "1.0 | \n", "194.73 | \n", "16.0 | \n", "0.0 | \n", "0.0 | \n", "
| 4 | \n", "33 | \n", "Desmopressin | \n", "solid | \n", "H01BA | \n", "H01B | \n", "H01 | \n", "H | \n", "1069.2200 | \n", "-6.10 | \n", "0.11000 | \n", "... | \n", "19.0 | \n", "435.41 | \n", "11.77 | \n", "0.0 | \n", "1068.426956 | \n", "1.0 | \n", "104.78 | \n", "15.0 | \n", "1.0 | \n", "0.0 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 2625 | \n", "14553 | \n", "Belumosudil | \n", "solid | \n", "L04AA | \n", "L04A | \n", "L04 | \n", "L | \n", "452.5180 | \n", "4.65 | \n", "0.00289 | \n", "... | \n", "7.0 | \n", "104.82 | \n", "4.11 | \n", "0.0 | \n", "452.196074 | \n", "1.0 | \n", "49.55 | \n", "6.0 | \n", "0.0 | \n", "1.0 | \n", "
| 2626 | \n", "14688 | \n", "Tebipenem pivoxil | \n", "NaN | \n", "J01DH | \n", "J01D | \n", "J01 | \n", "J | \n", "497.6300 | \n", "1.59 | \n", "0.16700 | \n", "... | \n", "9.0 | \n", "108.74 | \n", "6.27 | \n", "0.0 | \n", "497.165428 | \n", "1.0 | \n", "53.39 | \n", "6.0 | \n", "0.0 | \n", "1.0 | \n", "
| 2627 | \n", "14698 | \n", "Tosufloxacin | \n", "NaN | \n", "J01MA | \n", "J01M | \n", "J01 | \n", "J | \n", "404.3490 | \n", "0.47 | \n", "0.07620 | \n", "... | \n", "3.0 | \n", "99.76 | \n", "9.80 | \n", "1.0 | \n", "404.109625 | \n", "0.0 | \n", "37.18 | \n", "7.0 | \n", "0.0 | \n", "1.0 | \n", "
| 2628 | \n", "14931 | \n", "Linzagolix | \n", "solid | \n", "H01CC | \n", "H01C | \n", "H01 | \n", "H | \n", "508.4200 | \n", "3.88 | \n", "0.00198 | \n", "... | \n", "6.0 | \n", "114.40 | \n", "-3.50 | \n", "0.0 | \n", "508.055206 | \n", "1.0 | \n", "45.39 | \n", "7.0 | \n", "-1.0 | \n", "0.0 | \n", "
| 2629 | \n", "14995 | \n", "Methionine C-11 | \n", "NaN | \n", "V09IX | \n", "V09I | \n", "V09 | \n", "V | \n", "148.2100 | \n", "-2.20 | \n", "23.90000 | \n", "... | \n", "4.0 | \n", "63.32 | \n", "9.50 | \n", "0.0 | \n", "148.062484 | \n", "0.0 | \n", "15.54 | \n", "3.0 | \n", "0.0 | \n", "1.0 | \n", "
2630 rows × 26 columns
\n", "| name | \n", "Bivalirudin | \n", "Leuprolide | \n", "Goserelin | \n", "Gramicidin D | \n", "Desmopressin | \n", "Cetrorelix | \n", "Daptomycin | \n", "Abarelix | \n", "Pyridoxal phosphate | \n", "Cyanocobalamin | \n", "... | \n", "Naphthoquine | \n", "Odevixibat | \n", "Melphalan flufenamide | \n", "Deucravacitinib | \n", "Tegoprazan | \n", "Belumosudil | \n", "Tebipenem pivoxil | \n", "Tosufloxacin | \n", "Linzagolix | \n", "Methionine C-11 | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| name | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
| Bivalirudin | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
| Leuprolide | \n", "0 | \n", "0 | \n", "1 | \n", "0 | \n", "1 | \n", "0 | \n", "1 | \n", "0 | \n", "0 | \n", "1 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
| Goserelin | \n", "0 | \n", "1 | \n", "0 | \n", "0 | \n", "1 | \n", "0 | \n", "1 | \n", "0 | \n", "0 | \n", "1 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
| Gramicidin D | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
| Desmopressin | \n", "0 | \n", "1 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "0 | \n", "0 | \n", "1 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| Belumosudil | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
| Tebipenem pivoxil | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
| Tosufloxacin | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
| Linzagolix | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
| Methionine C-11 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "... | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "
2630 rows × 2630 columns
\n", "| name | \n", "Bivalirudin | \n", "Leuprolide | \n", "Goserelin | \n", "Gramicidin D | \n", "Desmopressin | \n", "Cetrorelix | \n", "Daptomycin | \n", "Abarelix | \n", "Pyridoxal phosphate | \n", "Cyanocobalamin | \n", "... | \n", "Naphthoquine | \n", "Odevixibat | \n", "Melphalan flufenamide | \n", "Deucravacitinib | \n", "Tegoprazan | \n", "Belumosudil | \n", "Tebipenem pivoxil | \n", "Tosufloxacin | \n", "Linzagolix | \n", "Methionine C-11 | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "1.000000 | \n", "0.306150 | \n", "0.288741 | \n", "0.083090 | \n", "0.310237 | \n", "0.0 | \n", "0.338457 | \n", "0.0 | \n", "0.0 | \n", "0.430352 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.305532 | \n", "0.0 | \n", "0.241866 | \n", "0.0 | \n", "0.0 | \n", "0.105519 | \n", "0.0 | \n", "
| 1 | \n", "0.306150 | \n", "1.000000 | \n", "0.780471 | \n", "0.087487 | \n", "0.587482 | \n", "0.0 | \n", "0.645092 | \n", "0.0 | \n", "0.0 | \n", "0.601979 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.167036 | \n", "0.0 | \n", "0.242198 | \n", "0.0 | \n", "0.0 | \n", "0.156851 | \n", "0.0 | \n", "
| 2 | \n", "0.288741 | \n", "0.780471 | \n", "1.000000 | \n", "0.110648 | \n", "0.603694 | \n", "0.0 | \n", "0.614604 | \n", "0.0 | \n", "0.0 | \n", "0.608478 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.123966 | \n", "0.0 | \n", "0.217510 | \n", "0.0 | \n", "0.0 | \n", "0.123984 | \n", "0.0 | \n", "
| 3 | \n", "0.083090 | \n", "0.087487 | \n", "0.110648 | \n", "1.000000 | \n", "0.028047 | \n", "0.0 | \n", "0.190443 | \n", "0.0 | \n", "0.0 | \n", "0.032498 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.000000 | \n", "0.0 | \n", "0.000000 | \n", "0.0 | \n", "0.0 | \n", "0.039841 | \n", "0.0 | \n", "
| 4 | \n", "0.310237 | \n", "0.587482 | \n", "0.603694 | \n", "0.028047 | \n", "1.000000 | \n", "0.0 | \n", "0.563808 | \n", "0.0 | \n", "0.0 | \n", "0.630617 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.099909 | \n", "0.0 | \n", "0.178126 | \n", "0.0 | \n", "0.0 | \n", "0.087996 | \n", "0.0 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 2625 | \n", "0.241866 | \n", "0.242198 | \n", "0.217510 | \n", "0.000000 | \n", "0.178126 | \n", "0.0 | \n", "0.343441 | \n", "0.0 | \n", "0.0 | \n", "0.270278 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.523597 | \n", "0.0 | \n", "1.000000 | \n", "0.0 | \n", "0.0 | \n", "0.186761 | \n", "0.0 | \n", "
| 2626 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.0 | \n", "0.000000 | \n", "0.0 | \n", "0.0 | \n", "0.000000 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.000000 | \n", "0.0 | \n", "0.000000 | \n", "0.0 | \n", "0.0 | \n", "0.000000 | \n", "0.0 | \n", "
| 2627 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.0 | \n", "0.000000 | \n", "0.0 | \n", "0.0 | \n", "0.000000 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.000000 | \n", "0.0 | \n", "0.000000 | \n", "0.0 | \n", "0.0 | \n", "0.000000 | \n", "0.0 | \n", "
| 2628 | \n", "0.105519 | \n", "0.156851 | \n", "0.123984 | \n", "0.039841 | \n", "0.087996 | \n", "0.0 | \n", "0.164395 | \n", "0.0 | \n", "0.0 | \n", "0.097106 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.082406 | \n", "0.0 | \n", "0.186761 | \n", "0.0 | \n", "0.0 | \n", "1.000000 | \n", "0.0 | \n", "
| 2629 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.0 | \n", "0.000000 | \n", "0.0 | \n", "0.0 | \n", "0.000000 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.000000 | \n", "0.0 | \n", "0.000000 | \n", "0.0 | \n", "0.0 | \n", "0.000000 | \n", "0.0 | \n", "
2630 rows × 2630 columns
\n", "