Learning BN as probabilistic classifier

Learning a Bayesian network can be used to obtain a classifier for one of the nodes of the model. For more about classifier, see pyagrum.skbn.

Creative Commons License

aGrUM

interactive online version

In [1]:
import pyagrum as gum
import pyagrum.lib.notebook as gnb

%matplotlib inline
from pyagrum.lib.bn2roc import showROC
from pyagrum.lib.bn2roc import showPR
from pyagrum.lib.bn2roc import showROC_PR

SIZE_LEARN = 10000
SIZE_VALID = 2000
In [2]:
bn = gum.loadBN("res/alarm.dsl")
bn
Out[2]:
G HREKG HREKG LVFAILURE LVFAILURE LVEDVOLUME LVEDVOLUME LVFAILURE->LVEDVOLUME STROKEVOLUME STROKEVOLUME LVFAILURE->STROKEVOLUME HISTORY HISTORY LVFAILURE->HISTORY DISCONNECT DISCONNECT VENTTUBE VENTTUBE DISCONNECT->VENTTUBE PVSAT PVSAT SAO2 SAO2 PVSAT->SAO2 CVP CVP LVEDVOLUME->CVP PCWP PCWP LVEDVOLUME->PCWP HYPOVOLEMIA HYPOVOLEMIA HYPOVOLEMIA->LVEDVOLUME HYPOVOLEMIA->STROKEVOLUME INSUFFANESTH INSUFFANESTH CATECHOL CATECHOL INSUFFANESTH->CATECHOL ERRCAUTER ERRCAUTER ERRCAUTER->HREKG HRSAT HRSAT ERRCAUTER->HRSAT ERRLOWOUTPUT ERRLOWOUTPUT HRBP HRBP ERRLOWOUTPUT->HRBP VENTMACH VENTMACH VENTMACH->VENTTUBE HR HR HR->HREKG CO CO HR->CO HR->HRBP HR->HRSAT STROKEVOLUME->CO BP BP PULMEMBOLUS PULMEMBOLUS PAP PAP PULMEMBOLUS->PAP SHUNT SHUNT PULMEMBOLUS->SHUNT PRESS PRESS VENTTUBE->PRESS VENTLUNG VENTLUNG VENTTUBE->VENTLUNG INTUBATION INTUBATION MINVOL MINVOL INTUBATION->MINVOL INTUBATION->SHUNT VENTALV VENTALV INTUBATION->VENTALV INTUBATION->PRESS INTUBATION->VENTLUNG TPR TPR TPR->BP TPR->CATECHOL CATECHOL->HR EXPCO2 EXPCO2 ANAPHYLAXIS ANAPHYLAXIS ANAPHYLAXIS->TPR CO->BP ARTCO2 ARTCO2 ARTCO2->CATECHOL ARTCO2->EXPCO2 KINKEDTUBE KINKEDTUBE KINKEDTUBE->PRESS KINKEDTUBE->VENTLUNG SHUNT->SAO2 SAO2->CATECHOL VENTALV->PVSAT VENTALV->ARTCO2 VENTLUNG->EXPCO2 VENTLUNG->MINVOL VENTLUNG->VENTALV FIO2 FIO2 FIO2->PVSAT MINVOLSET MINVOLSET MINVOLSET->VENTMACH
In [3]:
gum.generateSample(bn, SIZE_LEARN, "out/learn.csv", show_progress=True, with_labels=True)
gum.generateSample(bn, SIZE_VALID, "out/train.csv", show_progress=True, with_labels=True)
out/learn.csv: 100%|███████████████████████████████████████|
Log2-Likelihood : -152316.03720553295
out/train.csv: 100%|███████████████████████████████████████|
Log2-Likelihood : -30134.285305805093

Out[3]:
-30134.285305805093

Learning a BN from learn.csv

In [4]:
# Learning a BN from the database
learner = gum.BNLearner("out/train.csv")

bn2 = learner.useMIIC().learnBN()
currentTime = learner.currentTime()
In [5]:
gnb.flow.add(gnb.getBN(bn2, size="9"), f"Learned with {SIZE_LEARN} lines in {currentTime:.3f}s")
gnb.flow.display()
G HREKG HREKG HRSAT HRSAT HREKG->HRSAT LVFAILURE LVFAILURE LVEDVOLUME LVEDVOLUME LVFAILURE->LVEDVOLUME STROKEVOLUME STROKEVOLUME LVFAILURE->STROKEVOLUME PVSAT PVSAT SAO2 SAO2 PVSAT->SAO2 FIO2 FIO2 PVSAT->FIO2 DISCONNECT DISCONNECT VENTTUBE VENTTUBE DISCONNECT->VENTTUBE CVP CVP LVEDVOLUME->CVP PCWP PCWP LVEDVOLUME->PCWP HYPOVOLEMIA HYPOVOLEMIA HYPOVOLEMIA->LVEDVOLUME HYPOVOLEMIA->STROKEVOLUME INSUFFANESTH INSUFFANESTH ERRCAUTER ERRCAUTER ERRCAUTER->HREKG ERRCAUTER->HRSAT ERRLOWOUTPUT ERRLOWOUTPUT HRBP HRBP ERRLOWOUTPUT->HRBP BP BP HR HR HR->HREKG CO CO HR->CO HR->HRBP HR->HRSAT VENTMACH VENTMACH VENTMACH->VENTTUBE STROKEVOLUME->CO HISTORY HISTORY HISTORY->LVFAILURE PULMEMBOLUS PULMEMBOLUS SHUNT SHUNT PULMEMBOLUS->SHUNT PRESS PRESS VENTTUBE->PRESS VENTLUNG VENTLUNG VENTTUBE->VENTLUNG INTUBATION INTUBATION INTUBATION->SHUNT INTUBATION->PRESS TPR TPR TPR->BP CATECHOL CATECHOL CATECHOL->HR EXPCO2 EXPCO2 ARTCO2 ARTCO2 EXPCO2->ARTCO2 ANAPHYLAXIS ANAPHYLAXIS ANAPHYLAXIS->TPR CO->BP VENTALV VENTALV ARTCO2->VENTALV MINVOL MINVOL KINKEDTUBE KINKEDTUBE KINKEDTUBE->PRESS KINKEDTUBE->VENTLUNG SHUNT->STROKEVOLUME SHUNT->SAO2 PAP PAP PAP->PULMEMBOLUS SAO2->CATECHOL VENTALV->PVSAT VENTALV->INTUBATION VENTALV->MINVOL VENTLUNG->EXPCO2 VENTLUNG->VENTALV MINVOLSET MINVOLSET MINVOLSET->VENTMACH
Learned with 10000 lines in 0.254s
In [6]:
import pyagrum.lib.bn_vs_bn as bnvsbn

gnb.flow.add(gnb.getBNDiff(bn, bn2, size="8!"), "Diff with MIIC")
gnb.flow.add(bnvsbn.graphDiffLegend())
gnb.flow.display()
G KINKEDTUBE KINKEDTUBE VENTLUNG VENTLUNG KINKEDTUBE->VENTLUNG PRESS PRESS KINKEDTUBE->PRESS HYPOVOLEMIA HYPOVOLEMIA STROKEVOLUME STROKEVOLUME HYPOVOLEMIA->STROKEVOLUME LVEDVOLUME LVEDVOLUME HYPOVOLEMIA->LVEDVOLUME INTUBATION INTUBATION SHUNT SHUNT INTUBATION->SHUNT INTUBATION->VENTLUNG MINVOL MINVOL INTUBATION->MINVOL INTUBATION->PRESS VENTALV VENTALV MINVOLSET MINVOLSET VENTMACH VENTMACH MINVOLSET->VENTMACH PULMEMBOLUS PULMEMBOLUS PAP PAP PULMEMBOLUS->SHUNT INSUFFANESTH INSUFFANESTH CATECHOL CATECHOL INSUFFANESTH->CATECHOL ERRLOWOUTPUT ERRLOWOUTPUT HRBP HRBP ERRLOWOUTPUT->HRBP ERRCAUTER ERRCAUTER HRSAT HRSAT ERRCAUTER->HRSAT HREKG HREKG ERRCAUTER->HREKG FIO2 FIO2 PVSAT PVSAT LVFAILURE LVFAILURE LVFAILURE->STROKEVOLUME LVFAILURE->LVEDVOLUME HISTORY HISTORY DISCONNECT DISCONNECT VENTTUBE VENTTUBE DISCONNECT->VENTTUBE ANAPHYLAXIS ANAPHYLAXIS TPR TPR ANAPHYLAXIS->TPR PAP->PULMEMBOLUS CO CO STROKEVOLUME->CO TPR->CATECHOL BP BP TPR->BP PCWP PCWP LVEDVOLUME->PCWP CVP CVP LVEDVOLUME->CVP VENTMACH->VENTTUBE SHUNT->STROKEVOLUME SAO2 SAO2 SHUNT->SAO2 HISTORY->LVFAILURE VENTTUBE->VENTLUNG VENTTUBE->PRESS VENTLUNG->MINVOL VENTLUNG->VENTALV EXPCO2 EXPCO2 VENTLUNG->EXPCO2 VENTALV->INTUBATION VENTALV->MINVOL ARTCO2 ARTCO2 VENTALV->PVSAT ARTCO2->VENTALV ARTCO2->CATECHOL PVSAT->FIO2 PVSAT->SAO2 SAO2->CATECHOL EXPCO2->ARTCO2 HR HR CATECHOL->HR HR->HRBP HR->HRSAT HR->CO HR->HREKG CO->BP HREKG->HRSAT
Diff with MIIC
G a->b overflow c->d Missing e->f reversed g->h Correct
In [7]:
bn3 = learner.useGreedyHillClimbing().useNMLCorrection().useScoreBDeu().learnBN()
gnb.flow.add(gnb.getBNDiff(bn, bn3, size="8!"), "Diff with GHC/NMD/BDEU")
gnb.flow.add(bnvsbn.graphDiffLegend())
gnb.flow.display()
G KINKEDTUBE KINKEDTUBE VENTLUNG VENTLUNG PRESS PRESS KINKEDTUBE->PRESS HYPOVOLEMIA HYPOVOLEMIA STROKEVOLUME STROKEVOLUME LVEDVOLUME LVEDVOLUME HYPOVOLEMIA->LVEDVOLUME INTUBATION INTUBATION INTUBATION->KINKEDTUBE VENTMACH VENTMACH INTUBATION->VENTMACH SHUNT SHUNT INTUBATION->SHUNT MINVOL MINVOL INTUBATION->MINVOL INTUBATION->PRESS VENTALV VENTALV MINVOLSET MINVOLSET PULMEMBOLUS PULMEMBOLUS PAP PAP PULMEMBOLUS->PAP PULMEMBOLUS->SHUNT INSUFFANESTH INSUFFANESTH CATECHOL CATECHOL INSUFFANESTH->CATECHOL ERRLOWOUTPUT ERRLOWOUTPUT HRBP HRBP ERRCAUTER ERRCAUTER ERRCAUTER->HRBP HRSAT HRSAT ERRCAUTER->HRSAT HREKG HREKG FIO2 FIO2 PVSAT PVSAT FIO2->PVSAT LVFAILURE LVFAILURE LVFAILURE->STROKEVOLUME HISTORY HISTORY DISCONNECT DISCONNECT DISCONNECT->LVFAILURE VENTTUBE VENTTUBE DISCONNECT->VENTTUBE DISCONNECT->VENTLUNG ANAPHYLAXIS ANAPHYLAXIS TPR TPR STROKEVOLUME->HYPOVOLEMIA STROKEVOLUME->LVEDVOLUME STROKEVOLUME->HISTORY CO CO STROKEVOLUME->CO TPR->ANAPHYLAXIS BP BP TPR->BP LVEDVOLUME->LVFAILURE PCWP PCWP LVEDVOLUME->PCWP LVEDVOLUME->HISTORY CVP CVP LVEDVOLUME->CVP VENTMACH->MINVOLSET VENTMACH->VENTTUBE SHUNT->STROKEVOLUME SAO2 SAO2 SHUNT->SAO2 HISTORY->LVFAILURE VENTTUBE->KINKEDTUBE VENTTUBE->PRESS VENTLUNG->KINKEDTUBE VENTLUNG->INTUBATION VENTLUNG->VENTMACH VENTLUNG->VENTTUBE VENTLUNG->MINVOL VENTLUNG->VENTALV EXPCO2 EXPCO2 VENTLUNG->EXPCO2 VENTALV->INTUBATION VENTALV->MINVOL ARTCO2 ARTCO2 VENTALV->ARTCO2 VENTALV->PVSAT ARTCO2->EXPCO2 ARTCO2->CATECHOL PVSAT->SAO2 SAO2->CATECHOL SAO2->HREKG CATECHOL->TPR HR HR HR->ERRLOWOUTPUT HR->CATECHOL HR->CO HR->HREKG HRBP->ERRLOWOUTPUT HRBP->HR HRSAT->HR HRSAT->HRBP CO->BP HREKG->ERRCAUTER HREKG->HRBP HREKG->HRSAT
Diff with GHC/NMD/BDEU
G a->b overflow c->d Missing e->f reversed g->h Correct
In [8]:
bn4 = learner.useGreedyHillClimbing().useNMLCorrection().useScoreBDeu().setInitialDAG(bn2.dag()).learnBN()
gnb.flow.add(gnb.getBNDiff(bn, bn4, size="8!"), "Diff with GHC/NMD/BDEU with intial DAG from MIIC")
gnb.flow.add(bnvsbn.graphDiffLegend())
gnb.flow.display()
G KINKEDTUBE KINKEDTUBE VENTLUNG VENTLUNG KINKEDTUBE->VENTLUNG PRESS PRESS KINKEDTUBE->PRESS HYPOVOLEMIA HYPOVOLEMIA STROKEVOLUME STROKEVOLUME HYPOVOLEMIA->STROKEVOLUME LVEDVOLUME LVEDVOLUME HYPOVOLEMIA->LVEDVOLUME INTUBATION INTUBATION SHUNT SHUNT INTUBATION->SHUNT MINVOL MINVOL INTUBATION->PRESS VENTALV VENTALV MINVOLSET MINVOLSET VENTMACH VENTMACH MINVOLSET->VENTMACH PULMEMBOLUS PULMEMBOLUS PAP PAP PULMEMBOLUS->PAP PULMEMBOLUS->SHUNT INSUFFANESTH INSUFFANESTH CATECHOL CATECHOL INSUFFANESTH->CATECHOL ERRLOWOUTPUT ERRLOWOUTPUT HRBP HRBP ERRLOWOUTPUT->HRBP ERRCAUTER ERRCAUTER HRSAT HRSAT ERRCAUTER->HRSAT HREKG HREKG ERRCAUTER->HREKG FIO2 FIO2 PVSAT PVSAT FIO2->PVSAT LVFAILURE LVFAILURE LVFAILURE->STROKEVOLUME LVFAILURE->LVEDVOLUME HISTORY HISTORY DISCONNECT DISCONNECT DISCONNECT->LVFAILURE VENTTUBE VENTTUBE DISCONNECT->VENTTUBE ANAPHYLAXIS ANAPHYLAXIS TPR TPR STROKEVOLUME->SHUNT CO CO STROKEVOLUME->CO TPR->ANAPHYLAXIS BP BP TPR->BP PCWP PCWP LVEDVOLUME->PCWP CVP CVP LVEDVOLUME->CVP VENTMACH->VENTTUBE SAO2 SAO2 SHUNT->SAO2 HISTORY->LVFAILURE VENTTUBE->INTUBATION VENTTUBE->VENTLUNG VENTTUBE->PRESS VENTLUNG->INTUBATION VENTLUNG->MINVOL VENTLUNG->VENTALV ARTCO2 ARTCO2 VENTLUNG->ARTCO2 EXPCO2 EXPCO2 VENTLUNG->EXPCO2 MINVOL->INTUBATION VENTALV->INTUBATION VENTALV->MINVOL VENTALV->ARTCO2 VENTALV->PVSAT ARTCO2->EXPCO2 ARTCO2->CATECHOL PVSAT->SAO2 SAO2->CATECHOL CATECHOL->TPR HR HR CATECHOL->HR HR->HRBP HR->HRSAT HR->CO HR->HREKG CO->BP HREKG->HRSAT
Diff with GHC/NMD/BDEU with intial DAG from MIIC
G a->b overflow c->d Missing e->f reversed g->h Correct
In [9]:
print(bn2.names())
{'HREKG', 'LVFAILURE', 'PVSAT', 'DISCONNECT', 'LVEDVOLUME', 'HYPOVOLEMIA', 'INSUFFANESTH', 'ERRCAUTER', 'ERRLOWOUTPUT', 'BP', 'HR', 'VENTMACH', 'STROKEVOLUME', 'HISTORY', 'CVP', 'PULMEMBOLUS', 'VENTTUBE', 'PCWP', 'INTUBATION', 'TPR', 'CATECHOL', 'EXPCO2', 'ANAPHYLAXIS', 'CO', 'ARTCO2', 'MINVOL', 'KINKEDTUBE', 'HRBP', 'SHUNT', 'PAP', 'SAO2', 'VENTALV', 'PRESS', 'VENTLUNG', 'FIO2', 'HRSAT', 'MINVOLSET'}
In [10]:
gnb.showInference(bn2, evs={}, size="10")
../_images/notebooks_32-Learning_learningClassifier_13_0.svg

Two classifiers from the learned BN

In [11]:
print(bn2["HRSAT"])
print(bn2["INTUBATION"])
HRSAT:Labelized({HIGH|LOW|NORMAL})
INTUBATION:Labelized({ESOPHAGEAL|NORMAL|ONESIDED})
In [12]:
showROC(bn2, "out/train.csv", "HRSAT", "LOW", show_progress=False)
showROC(bn2, "out/train.csv", "HRSAT", "NORMAL", show_progress=False)
showROC(bn2, "out/train.csv", "HRSAT", "HIGH", show_progress=False);
../_images/notebooks_32-Learning_learningClassifier_16_0.svg
../_images/notebooks_32-Learning_learningClassifier_16_1.svg
../_images/notebooks_32-Learning_learningClassifier_16_2.svg
In [13]:
showROC(bn2, "out/train.csv", "INTUBATION", "ESOPHAGEAL", show_progress=False);
../_images/notebooks_32-Learning_learningClassifier_17_0.svg
In [14]:
showPR(bn2, "out/train.csv", "HRSAT", "LOW", show_progress=False);
../_images/notebooks_32-Learning_learningClassifier_18_0.svg
In [15]:
showPR(bn2, "out/train.csv", "INTUBATION", "ESOPHAGEAL", show_progress=False);
../_images/notebooks_32-Learning_learningClassifier_19_0.svg
In [16]:
showROC_PR(bn2, "out/train.csv", "HRSAT", "LOW", show_progress=False);
../_images/notebooks_32-Learning_learningClassifier_20_0.svg
In [17]:
showROC_PR(bn2, "out/train.csv", "INTUBATION", "ESOPHAGEAL", show_progress=False);
../_images/notebooks_32-Learning_learningClassifier_21_0.svg