{ "cells": [ { "cell_type": "code", "execution_count": 1, "id": "e15ff842", "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "import numpy as np\n", "import numpy as np\n", "import matplotlib.pyplot as plt\n", "import warnings\n", "import plotly.offline as py\n", "# py.init_notebook_mode(connected=True)\n", "import plotly.graph_objs as go\n", "import plotly.tools as tls\n", "import plotly.figure_factory as ff\n", "import seaborn as sns\n", "# warnings.filterwarnings('ignore') #ignore warning messages" ] }, { "cell_type": "code", "execution_count": 2, "id": "cf08041d", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | ID | \n", "pCR (outcome) | \n", "RelapseFreeSurvival (outcome) | \n", "Age | \n", "ER | \n", "PgR | \n", "HER2 | \n", "TrippleNegative | \n", "ChemoGrade | \n", "Proliferation | \n", "... | \n", "original_glszm_SmallAreaHighGrayLevelEmphasis | \n", "original_glszm_SmallAreaLowGrayLevelEmphasis | \n", "original_glszm_ZoneEntropy | \n", "original_glszm_ZonePercentage | \n", "original_glszm_ZoneVariance | \n", "original_ngtdm_Busyness | \n", "original_ngtdm_Coarseness | \n", "original_ngtdm_Complexity | \n", "original_ngtdm_Contrast | \n", "original_ngtdm_Strength | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
395 | \n", "TRG002948 | \n", "0 | \n", "54.500000 | \n", "58.5 | \n", "1 | \n", "0 | \n", "1 | \n", "0 | \n", "3 | \n", "2 | \n", "... | \n", "0.476493 | \n", "0.476493 | \n", "2.453583 | \n", "0.003229 | \n", "2.327038e+06 | \n", "18.562377 | \n", "0.013766 | \n", "0.018042 | \n", "0.000288 | \n", "0.012257 | \n", "
396 | \n", "TRG002954 | \n", "0 | \n", "49.250000 | \n", "34.3 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "3 | \n", "3 | \n", "... | \n", "0.418382 | \n", "0.418382 | \n", "2.995603 | \n", "0.004243 | \n", "1.005061e+06 | \n", "156.627179 | \n", "0.002228 | \n", "0.136015 | \n", "0.022148 | \n", "0.002098 | \n", "
397 | \n", "TRG002958 | \n", "0 | \n", "48.500000 | \n", "53.3 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "2 | \n", "1 | \n", "... | \n", "0.527779 | \n", "0.527778 | \n", "1.500000 | \n", "0.003728 | \n", "2.132007e+05 | \n", "0.996746 | \n", "0.252582 | \n", "0.007380 | \n", "0.000037 | \n", "0.231059 | \n", "
398 | \n", "TRG002961 | \n", "0 | \n", "47.500000 | \n", "68.8 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "3 | \n", "3 | \n", "... | \n", "0.313693 | \n", "0.313693 | \n", "3.573557 | \n", "0.001112 | \n", "2.008034e+07 | \n", "204.864200 | \n", "0.001372 | \n", "0.054063 | \n", "0.003697 | \n", "0.001368 | \n", "
399 | \n", "TRG002962 | \n", "0 | \n", "46.916667 | \n", "46.0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "2 | \n", "1 | \n", "... | \n", "0.670229 | \n", "0.670229 | \n", "1.857045 | \n", "0.006706 | \n", "5.609262e+05 | \n", "9.609163 | \n", "0.026591 | \n", "0.018682 | \n", "0.000311 | \n", "0.022676 | \n", "
5 rows × 120 columns
\n", "\n", " | pCR (outcome) | \n", "RelapseFreeSurvival (outcome) | \n", "
---|---|---|
count | \n", "400.000000 | \n", "400.000000 | \n", "
mean | \n", "12.697500 | \n", "56.000208 | \n", "
std | \n", "111.107417 | \n", "27.137584 | \n", "
min | \n", "0.000000 | \n", "0.000000 | \n", "
25% | \n", "0.000000 | \n", "38.000000 | \n", "
50% | \n", "0.000000 | \n", "55.000000 | \n", "
75% | \n", "0.000000 | \n", "73.000000 | \n", "
max | \n", "999.000000 | \n", "144.000000 | \n", "
\n", " | pCR (outcome) | \n", "RelapseFreeSurvival (outcome) | \n", "Age | \n", "ER | \n", "PgR | \n", "HER2 | \n", "TrippleNegative | \n", "ChemoGrade | \n", "Proliferation | \n", "HistologyType | \n", "LNStatus | \n", "TumourStage | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "1 | \n", "144.000000 | \n", "41.0 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "3 | \n", "3 | \n", "1 | \n", "1 | \n", "2 | \n", "
1 | \n", "0 | \n", "142.000000 | \n", "39.0 | \n", "1 | \n", "1 | \n", "0 | \n", "0 | \n", "3 | \n", "3 | \n", "1 | \n", "1 | \n", "2 | \n", "
2 | \n", "1 | \n", "135.000000 | \n", "31.0 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "2 | \n", "1 | \n", "1 | \n", "0 | \n", "2 | \n", "
3 | \n", "0 | \n", "12.000000 | \n", "35.0 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "3 | \n", "3 | \n", "1 | \n", "1 | \n", "3 | \n", "
4 | \n", "0 | \n", "109.000000 | \n", "61.0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "2 | \n", "1 | \n", "1 | \n", "0 | \n", "2 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
395 | \n", "0 | \n", "54.500000 | \n", "58.5 | \n", "1 | \n", "0 | \n", "1 | \n", "0 | \n", "3 | \n", "2 | \n", "1 | \n", "1 | \n", "4 | \n", "
396 | \n", "0 | \n", "49.250000 | \n", "34.3 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "3 | \n", "3 | \n", "1 | \n", "0 | \n", "2 | \n", "
397 | \n", "0 | \n", "48.500000 | \n", "53.3 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "2 | \n", "1 | \n", "1 | \n", "0 | \n", "2 | \n", "
398 | \n", "0 | \n", "47.500000 | \n", "68.8 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "3 | \n", "3 | \n", "1 | \n", "1 | \n", "3 | \n", "
399 | \n", "0 | \n", "46.916667 | \n", "46.0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "2 | \n", "1 | \n", "1 | \n", "1 | \n", "2 | \n", "
400 rows × 12 columns
\n", "\n", " | pCR (outcome) | \n", "RelapseFreeSurvival (outcome) | \n", "Age | \n", "ER | \n", "PgR | \n", "HER2 | \n", "TrippleNegative | \n", "ChemoGrade | \n", "Proliferation | \n", "HistologyType | \n", "LNStatus | \n", "TumourStage | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|
count | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "
mean | \n", "0.210000 | \n", "56.000208 | \n", "51.804674 | \n", "0.547500 | \n", "0.405000 | \n", "0.300000 | \n", "0.332500 | \n", "2.397500 | \n", "1.572500 | \n", "1.147500 | \n", "0.535000 | \n", "2.607500 | \n", "
std | \n", "0.407818 | \n", "27.137584 | \n", "10.948522 | \n", "0.498362 | \n", "0.491507 | \n", "0.458831 | \n", "0.471699 | \n", "0.500119 | \n", "0.765643 | \n", "0.355048 | \n", "0.499398 | \n", "0.897473 | \n", "
min | \n", "0.000000 | \n", "0.000000 | \n", "23.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "0.000000 | \n", "1.000000 | \n", "
25% | \n", "0.000000 | \n", "38.000000 | \n", "44.516769 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "2.000000 | \n", "1.000000 | \n", "1.000000 | \n", "0.000000 | \n", "2.000000 | \n", "
50% | \n", "0.000000 | \n", "55.000000 | \n", "51.019507 | \n", "1.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "2.000000 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "2.000000 | \n", "
75% | \n", "0.000000 | \n", "73.000000 | \n", "60.000000 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "3.000000 | \n", "2.000000 | \n", "1.000000 | \n", "1.000000 | \n", "3.000000 | \n", "
max | \n", "1.000000 | \n", "144.000000 | \n", "79.603012 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "3.000000 | \n", "3.000000 | \n", "2.000000 | \n", "1.000000 | \n", "4.000000 | \n", "
\n", " | pCR (outcome) | \n", "RelapseFreeSurvival (outcome) | \n", "Age | \n", "ER | \n", "PgR | \n", "HER2 | \n", "TrippleNegative | \n", "ChemoGrade | \n", "Proliferation | \n", "HistologyType | \n", "... | \n", "original_glszm_SmallAreaHighGrayLevelEmphasis | \n", "original_glszm_SmallAreaLowGrayLevelEmphasis | \n", "original_glszm_ZoneEntropy | \n", "original_glszm_ZonePercentage | \n", "original_glszm_ZoneVariance | \n", "original_ngtdm_Busyness | \n", "original_ngtdm_Coarseness | \n", "original_ngtdm_Complexity | \n", "original_ngtdm_Contrast | \n", "original_ngtdm_Strength | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
count | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "... | \n", "4.000000e+02 | \n", "4.000000e+02 | \n", "4.000000e+02 | \n", "400.000000 | \n", "4.000000e+02 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "
mean | \n", "0.210000 | \n", "56.000208 | \n", "51.804674 | \n", "0.547500 | \n", "0.405000 | \n", "0.300000 | \n", "0.332500 | \n", "2.397500 | \n", "1.572500 | \n", "1.147500 | \n", "... | \n", "3.957637e-01 | \n", "3.911005e-01 | \n", "2.722189e+00 | \n", "0.003347 | \n", "5.679717e+07 | \n", "178.311246 | \n", "32500.032620 | \n", "0.056935 | \n", "0.005965 | \n", "0.029322 | \n", "
std | \n", "0.407818 | \n", "27.137584 | \n", "10.948522 | \n", "0.498362 | \n", "0.491507 | \n", "0.458831 | \n", "0.471699 | \n", "0.500119 | \n", "0.765643 | \n", "0.355048 | \n", "... | \n", "1.666319e-01 | \n", "1.615922e-01 | \n", "7.648849e-01 | \n", "0.002419 | \n", "7.063846e+08 | \n", "1045.453432 | \n", "177545.921568 | \n", "0.047179 | \n", "0.008379 | \n", "0.115915 | \n", "
min | \n", "0.000000 | \n", "0.000000 | \n", "23.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "... | \n", "7.050000e-11 | \n", "7.050000e-11 | \n", "-3.200000e-16 | \n", "0.000008 | \n", "0.000000e+00 | \n", "0.000000 | \n", "0.000248 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "
25% | \n", "0.000000 | \n", "38.000000 | \n", "44.516769 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "2.000000 | \n", "1.000000 | \n", "1.000000 | \n", "... | \n", "3.199017e-01 | \n", "3.184398e-01 | \n", "2.340783e+00 | \n", "0.001389 | \n", "1.030473e+06 | \n", "18.760570 | \n", "0.001826 | \n", "0.018628 | \n", "0.000310 | \n", "0.001464 | \n", "
50% | \n", "0.000000 | \n", "55.000000 | \n", "51.019507 | \n", "1.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "2.000000 | \n", "1.000000 | \n", "1.000000 | \n", "... | \n", "4.095627e-01 | \n", "4.054695e-01 | \n", "2.814884e+00 | \n", "0.002944 | \n", "3.277334e+06 | \n", "67.929659 | \n", "0.004383 | \n", "0.047740 | \n", "0.002330 | \n", "0.003276 | \n", "
75% | \n", "0.000000 | \n", "73.000000 | \n", "60.000000 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "3.000000 | \n", "2.000000 | \n", "1.000000 | \n", "... | \n", "5.000049e-01 | \n", "4.956920e-01 | \n", "3.304411e+00 | \n", "0.004798 | \n", "9.079686e+06 | \n", "157.370294 | \n", "0.013769 | \n", "0.085321 | \n", "0.007962 | \n", "0.009479 | \n", "
max | \n", "1.000000 | \n", "144.000000 | \n", "79.603012 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "3.000000 | \n", "3.000000 | \n", "2.000000 | \n", "... | \n", "8.773779e-01 | \n", "8.571429e-01 | \n", "4.947427e+00 | \n", "0.011301 | \n", "1.390001e+10 | \n", "20764.693790 | \n", "1000000.000000 | \n", "0.285100 | \n", "0.060742 | \n", "1.145601 | \n", "
8 rows × 119 columns
\n", "\n", " | pCR (outcome) | \n", "Age | \n", "ER | \n", "PgR | \n", "HER2 | \n", "TrippleNegative | \n", "ChemoGrade | \n", "Proliferation | \n", "HistologyType | \n", "LNStatus | \n", "TumourStage | \n", "0 | \n", "1 | \n", "2 | \n", "3 | \n", "4 | \n", "5 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "1 | \n", "41.0 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "3 | \n", "3 | \n", "1 | \n", "1 | \n", "2 | \n", "12.596187 | \n", "1.476490 | \n", "0.835322 | \n", "3.572652 | \n", "3.680844 | \n", "1.588340 | \n", "
1 | \n", "0 | \n", "39.0 | \n", "1 | \n", "1 | \n", "0 | \n", "0 | \n", "3 | \n", "3 | \n", "1 | \n", "1 | \n", "2 | \n", "-3.402929 | \n", "-1.950037 | \n", "-1.825297 | \n", "1.893426 | \n", "-1.392585 | \n", "0.782602 | \n", "
2 | \n", "1 | \n", "31.0 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "2 | \n", "1 | \n", "1 | \n", "0 | \n", "2 | \n", "-3.831085 | \n", "-2.983421 | \n", "-2.157645 | \n", "2.095281 | \n", "-0.686464 | \n", "2.161302 | \n", "
3 | \n", "0 | \n", "35.0 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "3 | \n", "3 | \n", "1 | \n", "1 | \n", "3 | \n", "-6.312342 | \n", "-1.559572 | \n", "-1.819064 | \n", "2.526369 | \n", "-0.793346 | \n", "0.518627 | \n", "
4 | \n", "0 | \n", "61.0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "2 | \n", "1 | \n", "1 | \n", "0 | \n", "2 | \n", "-2.275703 | \n", "-3.647228 | \n", "-2.008927 | \n", "3.357714 | \n", "-0.870179 | \n", "2.050370 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
395 | \n", "0 | \n", "58.5 | \n", "1 | \n", "0 | \n", "1 | \n", "0 | \n", "3 | \n", "2 | \n", "1 | \n", "1 | \n", "4 | \n", "-4.421618 | \n", "-3.627292 | \n", "-0.807734 | \n", "0.431116 | \n", "0.401040 | \n", "0.350318 | \n", "
396 | \n", "0 | \n", "34.3 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "3 | \n", "3 | \n", "1 | \n", "0 | \n", "2 | \n", "10.765770 | \n", "1.886069 | \n", "0.430573 | \n", "-0.233894 | \n", "-0.328621 | \n", "0.065289 | \n", "
397 | \n", "0 | \n", "53.3 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "2 | \n", "1 | \n", "1 | \n", "0 | \n", "2 | \n", "-2.991509 | \n", "-5.684329 | \n", "-0.548646 | \n", "-6.053106 | \n", "3.533711 | \n", "1.468567 | \n", "
398 | \n", "0 | \n", "68.8 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "3 | \n", "3 | \n", "1 | \n", "1 | \n", "3 | \n", "0.371324 | \n", "0.799043 | \n", "0.445663 | \n", "5.795988 | \n", "0.859414 | \n", "-2.789871 | \n", "
399 | \n", "0 | \n", "46.0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "2 | \n", "1 | \n", "1 | \n", "1 | \n", "2 | \n", "-2.744353 | \n", "-4.132731 | \n", "-1.735130 | \n", "-4.106370 | \n", "-0.757445 | \n", "2.916702 | \n", "
400 rows × 17 columns
\n", "\n", " | pCR (outcome) | \n", "Age | \n", "ER | \n", "PgR | \n", "HER2 | \n", "TrippleNegative | \n", "ChemoGrade | \n", "Proliferation | \n", "HistologyType | \n", "LNStatus | \n", "TumourStage | \n", "COMP0 | \n", "COMP1 | \n", "COMP2 | \n", "COMP3 | \n", "COMP4 | \n", "COMP5 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "1 | \n", "41.0 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "3 | \n", "3 | \n", "1 | \n", "1 | \n", "2 | \n", "12.596187 | \n", "1.476490 | \n", "0.835322 | \n", "3.572652 | \n", "3.680844 | \n", "1.588340 | \n", "
1 | \n", "0 | \n", "39.0 | \n", "1 | \n", "1 | \n", "0 | \n", "0 | \n", "3 | \n", "3 | \n", "1 | \n", "1 | \n", "2 | \n", "-3.402929 | \n", "-1.950037 | \n", "-1.825297 | \n", "1.893426 | \n", "-1.392585 | \n", "0.782602 | \n", "
2 | \n", "1 | \n", "31.0 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "2 | \n", "1 | \n", "1 | \n", "0 | \n", "2 | \n", "-3.831085 | \n", "-2.983421 | \n", "-2.157645 | \n", "2.095281 | \n", "-0.686464 | \n", "2.161302 | \n", "
3 | \n", "0 | \n", "35.0 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "3 | \n", "3 | \n", "1 | \n", "1 | \n", "3 | \n", "-6.312342 | \n", "-1.559572 | \n", "-1.819064 | \n", "2.526369 | \n", "-0.793346 | \n", "0.518627 | \n", "
4 | \n", "0 | \n", "61.0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "2 | \n", "1 | \n", "1 | \n", "0 | \n", "2 | \n", "-2.275703 | \n", "-3.647228 | \n", "-2.008927 | \n", "3.357714 | \n", "-0.870179 | \n", "2.050370 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
395 | \n", "0 | \n", "58.5 | \n", "1 | \n", "0 | \n", "1 | \n", "0 | \n", "3 | \n", "2 | \n", "1 | \n", "1 | \n", "4 | \n", "-4.421618 | \n", "-3.627292 | \n", "-0.807734 | \n", "0.431116 | \n", "0.401040 | \n", "0.350318 | \n", "
396 | \n", "0 | \n", "34.3 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "3 | \n", "3 | \n", "1 | \n", "0 | \n", "2 | \n", "10.765770 | \n", "1.886069 | \n", "0.430573 | \n", "-0.233894 | \n", "-0.328621 | \n", "0.065289 | \n", "
397 | \n", "0 | \n", "53.3 | \n", "0 | \n", "0 | \n", "0 | \n", "1 | \n", "2 | \n", "1 | \n", "1 | \n", "0 | \n", "2 | \n", "-2.991509 | \n", "-5.684329 | \n", "-0.548646 | \n", "-6.053106 | \n", "3.533711 | \n", "1.468567 | \n", "
398 | \n", "0 | \n", "68.8 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "3 | \n", "3 | \n", "1 | \n", "1 | \n", "3 | \n", "0.371324 | \n", "0.799043 | \n", "0.445663 | \n", "5.795988 | \n", "0.859414 | \n", "-2.789871 | \n", "
399 | \n", "0 | \n", "46.0 | \n", "1 | \n", "0 | \n", "0 | \n", "0 | \n", "2 | \n", "1 | \n", "1 | \n", "1 | \n", "2 | \n", "-2.744353 | \n", "-4.132731 | \n", "-1.735130 | \n", "-4.106370 | \n", "-0.757445 | \n", "2.916702 | \n", "
400 rows × 17 columns
\n", "\n", " | pCR (outcome) | \n", "Age | \n", "ER | \n", "PgR | \n", "HER2 | \n", "TrippleNegative | \n", "ChemoGrade | \n", "Proliferation | \n", "HistologyType | \n", "LNStatus | \n", "TumourStage | \n", "COMP0 | \n", "COMP1 | \n", "COMP2 | \n", "COMP3 | \n", "COMP4 | \n", "COMP5 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
count | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "4.000000e+02 | \n", "4.000000e+02 | \n", "4.000000e+02 | \n", "4.000000e+02 | \n", "4.000000e+02 | \n", "4.000000e+02 | \n", "
mean | \n", "0.210000 | \n", "51.804674 | \n", "0.547500 | \n", "0.405000 | \n", "0.300000 | \n", "0.332500 | \n", "2.397500 | \n", "1.572500 | \n", "1.147500 | \n", "0.535000 | \n", "2.607500 | \n", "1.421085e-16 | \n", "-3.552714e-17 | \n", "-8.437695e-17 | \n", "-1.065814e-16 | \n", "1.776357e-17 | \n", "-3.552714e-17 | \n", "
std | \n", "0.407818 | \n", "10.948522 | \n", "0.498362 | \n", "0.491507 | \n", "0.458831 | \n", "0.471699 | \n", "0.500119 | \n", "0.765643 | \n", "0.355048 | \n", "0.499398 | \n", "0.897473 | \n", "5.913835e+00 | \n", "3.956354e+00 | \n", "3.625338e+00 | \n", "3.498424e+00 | \n", "2.576519e+00 | \n", "2.271563e+00 | \n", "
min | \n", "0.000000 | \n", "23.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "0.000000 | \n", "1.000000 | \n", "-2.137126e+01 | \n", "-7.155386e+00 | \n", "-3.817510e+00 | \n", "-1.234668e+01 | \n", "-6.612577e+00 | \n", "-1.025440e+01 | \n", "
25% | \n", "0.000000 | \n", "44.516769 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "2.000000 | \n", "1.000000 | \n", "1.000000 | \n", "0.000000 | \n", "2.000000 | \n", "-4.380918e+00 | \n", "-2.300239e+00 | \n", "-1.501204e+00 | \n", "-2.016138e+00 | \n", "-1.603999e+00 | \n", "-1.087117e+00 | \n", "
50% | \n", "0.000000 | \n", "51.019507 | \n", "1.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "2.000000 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "2.000000 | \n", "-6.291532e-01 | \n", "-4.220578e-01 | \n", "-7.452754e-01 | \n", "3.711719e-01 | \n", "-2.808058e-01 | \n", "-3.972333e-02 | \n", "
75% | \n", "0.000000 | \n", "60.000000 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "3.000000 | \n", "2.000000 | \n", "1.000000 | \n", "1.000000 | \n", "3.000000 | \n", "3.844593e+00 | \n", "1.489531e+00 | \n", "1.908735e-01 | \n", "2.303221e+00 | \n", "1.190874e+00 | \n", "1.120237e+00 | \n", "
max | \n", "1.000000 | \n", "79.603012 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "3.000000 | \n", "3.000000 | \n", "2.000000 | \n", "1.000000 | \n", "4.000000 | \n", "2.246977e+01 | \n", "4.495662e+01 | \n", "2.031779e+01 | \n", "1.283187e+01 | \n", "1.878213e+01 | \n", "2.207831e+01 | \n", "
\n", " | pCR (outcome) | \n", "Age | \n", "ER | \n", "PgR | \n", "HER2 | \n", "TrippleNegative | \n", "ChemoGrade | \n", "Proliferation | \n", "HistologyType | \n", "LNStatus | \n", "TumourStage | \n", "COMP0 | \n", "COMP1 | \n", "COMP2 | \n", "COMP3 | \n", "COMP4 | \n", "COMP5 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
count | \n", "400.000000 | \n", "4.000000e+02 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "400.000000 | \n", "4.000000e+02 | \n", "4.000000e+02 | \n", "4.000000e+02 | \n", "4.000000e+02 | \n", "4.000000e+02 | \n", "4.000000e+02 | \n", "
mean | \n", "0.210000 | \n", "-9.325873e-17 | \n", "0.547500 | \n", "0.405000 | \n", "0.300000 | \n", "0.332500 | \n", "2.397500 | \n", "1.572500 | \n", "1.147500 | \n", "0.535000 | \n", "2.607500 | \n", "1.421085e-16 | \n", "-3.552714e-17 | \n", "-8.437695e-17 | \n", "-1.065814e-16 | \n", "1.776357e-17 | \n", "-3.552714e-17 | \n", "
std | \n", "0.407818 | \n", "1.001252e+00 | \n", "0.498362 | \n", "0.491507 | \n", "0.458831 | \n", "0.471699 | \n", "0.500119 | \n", "0.765643 | \n", "0.355048 | \n", "0.499398 | \n", "0.897473 | \n", "5.913835e+00 | \n", "3.956354e+00 | \n", "3.625338e+00 | \n", "3.498424e+00 | \n", "2.576519e+00 | \n", "2.271563e+00 | \n", "
min | \n", "0.000000 | \n", "-2.634214e+00 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "0.000000 | \n", "1.000000 | \n", "-2.137126e+01 | \n", "-7.155386e+00 | \n", "-3.817510e+00 | \n", "-1.234668e+01 | \n", "-6.612577e+00 | \n", "-1.025440e+01 | \n", "
25% | \n", "0.000000 | \n", "-6.664855e-01 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "2.000000 | \n", "1.000000 | \n", "1.000000 | \n", "0.000000 | \n", "2.000000 | \n", "-4.380918e+00 | \n", "-2.300239e+00 | \n", "-1.501204e+00 | \n", "-2.016138e+00 | \n", "-1.603999e+00 | \n", "-1.087117e+00 | \n", "
50% | \n", "0.000000 | \n", "-7.180426e-02 | \n", "1.000000 | \n", "0.000000 | \n", "0.000000 | \n", "0.000000 | \n", "2.000000 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "2.000000 | \n", "-6.291532e-01 | \n", "-4.220578e-01 | \n", "-7.452754e-01 | \n", "3.711719e-01 | \n", "-2.808058e-01 | \n", "-3.972333e-02 | \n", "
75% | \n", "0.000000 | \n", "7.494700e-01 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "3.000000 | \n", "2.000000 | \n", "1.000000 | \n", "1.000000 | \n", "3.000000 | \n", "3.844593e+00 | \n", "1.489531e+00 | \n", "1.908735e-01 | \n", "2.303221e+00 | \n", "1.190874e+00 | \n", "1.120237e+00 | \n", "
max | \n", "1.000000 | \n", "2.542183e+00 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "1.000000 | \n", "3.000000 | \n", "3.000000 | \n", "2.000000 | \n", "1.000000 | \n", "4.000000 | \n", "2.246977e+01 | \n", "4.495662e+01 | \n", "2.031779e+01 | \n", "1.283187e+01 | \n", "1.878213e+01 | \n", "2.207831e+01 | \n", "
XGBClassifier(base_score=None, booster='gbtree', callbacks=None,\n", " colsample_bylevel=None, colsample_bynode=None,\n", " colsample_bytree=0.4, device=None, early_stopping_rounds=None,\n", " enable_categorical=False, eval_metric=None, feature_types=None,\n", " gamma=0.1, grow_policy=None, importance_type=None,\n", " interaction_constraints=None, learning_rate=0.05, max_bin=None,\n", " max_cat_threshold=None, max_cat_to_onehot=None,\n", " max_delta_step=None, max_depth=10, max_leaves=None,\n", " min_child_weight=1, missing=nan, monotone_constraints=None,\n", " multi_strategy=None, n_estimators=None, n_jobs=None,\n", " num_parallel_tree=None, random_state=None, ...)In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
XGBClassifier(base_score=None, booster='gbtree', callbacks=None,\n", " colsample_bylevel=None, colsample_bynode=None,\n", " colsample_bytree=0.4, device=None, early_stopping_rounds=None,\n", " enable_categorical=False, eval_metric=None, feature_types=None,\n", " gamma=0.1, grow_policy=None, importance_type=None,\n", " interaction_constraints=None, learning_rate=0.05, max_bin=None,\n", " max_cat_threshold=None, max_cat_to_onehot=None,\n", " max_delta_step=None, max_depth=10, max_leaves=None,\n", " min_child_weight=1, missing=nan, monotone_constraints=None,\n", " multi_strategy=None, n_estimators=None, n_jobs=None,\n", " num_parallel_tree=None, random_state=None, ...)
XGBClassifier(base_score=None, booster='gbtree', callbacks=None,\n", " colsample_bylevel=None, colsample_bynode=None,\n", " colsample_bytree=0.4, device=None, early_stopping_rounds=None,\n", " enable_categorical=False, eval_metric=None, feature_types=None,\n", " gamma=0.1, grow_policy=None, importance_type=None,\n", " interaction_constraints=None, learning_rate=0.05, max_bin=None,\n", " max_cat_threshold=None, max_cat_to_onehot=None,\n", " max_delta_step=None, max_depth=10, max_leaves=None,\n", " min_child_weight=1, missing=nan, monotone_constraints=None,\n", " multi_strategy=None, n_estimators=None, n_jobs=None,\n", " num_parallel_tree=None, random_state=None, ...)In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
XGBClassifier(base_score=None, booster='gbtree', callbacks=None,\n", " colsample_bylevel=None, colsample_bynode=None,\n", " colsample_bytree=0.4, device=None, early_stopping_rounds=None,\n", " enable_categorical=False, eval_metric=None, feature_types=None,\n", " gamma=0.1, grow_policy=None, importance_type=None,\n", " interaction_constraints=None, learning_rate=0.05, max_bin=None,\n", " max_cat_threshold=None, max_cat_to_onehot=None,\n", " max_delta_step=None, max_depth=10, max_leaves=None,\n", " min_child_weight=1, missing=nan, monotone_constraints=None,\n", " multi_strategy=None, n_estimators=None, n_jobs=None,\n", " num_parallel_tree=None, random_state=None, ...)
LGBMClassifier()In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
LGBMClassifier()
LogisticRegression(max_iter=500)In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
LogisticRegression(max_iter=500)
SVC(gamma=0.1)In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
SVC(gamma=0.1)
SVC(gamma=0.1)In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
SVC(gamma=0.1)