There are numerous algorithms proposed in the literature for learning causal graphical probabilistic
models. Each one of them is typically equipped with one or more tuning hyper-parameters. The
choice of optimal algorithm and hyper-parameter values is not universal; it depends on the size
of the network, the density of the true causal structure, the sample size, as well as the metric of
quality of learning a causal structure. Thus, the challenge to a practitioner is how to “tune” these
choices, given that the true graph is unknown and the learning task is unsupervised. In the paper,
we evaluate two previously proposed methods for tuning, one based on stability of the learned
structure under perturbations (bootstrapping) of the input data and the other based on balancing the
in-sample fitting of the model with the model complexity. We propose and comparatively evaluate
a new method that treats a causal model as a set of predictive models: one for each node given its
Markov Blanket. It then tunes the choices using out-of-sample protocols for supervised methods
such as cross-validation. The proposed method performs on par or better than the previous methods
for most metrics.
%0 Journal Article
%1 noauthororeditor
%A Biza, K.
%A Tsamardinos, I.
%A Triantafillou, S.
%D 2020
%J Proceedings of the Tenth International Conference on Probabilistic Graphical Models, in PMLR
%K mxmcausalpath
%T Tuning Causal Discovery Algorithms
%U https://pgm2020.cs.aau.dk/wp-content/uploads/2020/09/biza20.pdf
%X There are numerous algorithms proposed in the literature for learning causal graphical probabilistic
models. Each one of them is typically equipped with one or more tuning hyper-parameters. The
choice of optimal algorithm and hyper-parameter values is not universal; it depends on the size
of the network, the density of the true causal structure, the sample size, as well as the metric of
quality of learning a causal structure. Thus, the challenge to a practitioner is how to “tune” these
choices, given that the true graph is unknown and the learning task is unsupervised. In the paper,
we evaluate two previously proposed methods for tuning, one based on stability of the learned
structure under perturbations (bootstrapping) of the input data and the other based on balancing the
in-sample fitting of the model with the model complexity. We propose and comparatively evaluate
a new method that treats a causal model as a set of predictive models: one for each node given its
Markov Blanket. It then tunes the choices using out-of-sample protocols for supervised methods
such as cross-validation. The proposed method performs on par or better than the previous methods
for most metrics.
@article{noauthororeditor,
abstract = {There are numerous algorithms proposed in the literature for learning causal graphical probabilistic
models. Each one of them is typically equipped with one or more tuning hyper-parameters. The
choice of optimal algorithm and hyper-parameter values is not universal; it depends on the size
of the network, the density of the true causal structure, the sample size, as well as the metric of
quality of learning a causal structure. Thus, the challenge to a practitioner is how to “tune” these
choices, given that the true graph is unknown and the learning task is unsupervised. In the paper,
we evaluate two previously proposed methods for tuning, one based on stability of the learned
structure under perturbations (bootstrapping) of the input data and the other based on balancing the
in-sample fitting of the model with the model complexity. We propose and comparatively evaluate
a new method that treats a causal model as a set of predictive models: one for each node given its
Markov Blanket. It then tunes the choices using out-of-sample protocols for supervised methods
such as cross-validation. The proposed method performs on par or better than the previous methods
for most metrics.},
added-at = {2020-09-08T10:21:24.000+0200},
author = {Biza, K. and Tsamardinos, I. and Triantafillou, S.},
biburl = {https://www.bibsonomy.org/bibtex/227a19344432d6e2831ae6fac806fe077/mensxmachina},
interhash = {8a79a42946abf9f62c4d45b8110b6a94},
intrahash = {27a19344432d6e2831ae6fac806fe077},
journal = {Proceedings of the Tenth International Conference on Probabilistic Graphical Models, in PMLR},
keywords = {mxmcausalpath},
timestamp = {2021-03-08T12:02:38.000+0100},
title = {Tuning Causal Discovery Algorithms},
url = {https://pgm2020.cs.aau.dk/wp-content/uploads/2020/09/biza20.pdf},
year = 2020
}