Accurately modeling cellular response to perturbations is a central goal of computational biology. While such modeling has been proposed based on statistical, mechanistic and machine learning models in specific settings, no generalization of predictions to phenomena absent from training data i.e. ‘out-of-sample’ have yet been demonstrated. Here, we present scGen, a model combining variational autoencoders and latent space vector arithmetics for high-dimensional single-cell gene expression data. In benchmarks across a broad range of examples, we show that scGen accurately models dose and infection response of cells across cell types, studies and species. In particular, we demonstrate that scGen learns cell type and species specific response implying that it captures features that distinguish responding from non-responding genes and cells. With the upcoming availability of large-scale atlases of organs in healthy state, we envision scGen to become a tool for experimental design through in silico screening of perturbation response in the context of disease and drug treatment.
Description
Generative modeling and latent space arithmetics predict single-cell perturbation response across cell types, studies and species | bioRxiv
%0 Journal Article
%1 lotfollahi2018generative
%A Lotfollahi, M.
%A Wolf, F. Alexander
%A Theis, Fabian J.
%D 2018
%I Cold Spring Harbor Laboratory
%J bioRxiv
%K afcs bayesian cell cvae gan generative model response single vae
%R 10.1101/478503
%T Generative modeling and latent space arithmetics predict single-cell perturbation response across cell types, studies and species
%U https://www.biorxiv.org/content/early/2018/11/29/478503
%X Accurately modeling cellular response to perturbations is a central goal of computational biology. While such modeling has been proposed based on statistical, mechanistic and machine learning models in specific settings, no generalization of predictions to phenomena absent from training data i.e. ‘out-of-sample’ have yet been demonstrated. Here, we present scGen, a model combining variational autoencoders and latent space vector arithmetics for high-dimensional single-cell gene expression data. In benchmarks across a broad range of examples, we show that scGen accurately models dose and infection response of cells across cell types, studies and species. In particular, we demonstrate that scGen learns cell type and species specific response implying that it captures features that distinguish responding from non-responding genes and cells. With the upcoming availability of large-scale atlases of organs in healthy state, we envision scGen to become a tool for experimental design through in silico screening of perturbation response in the context of disease and drug treatment.
@article{lotfollahi2018generative,
abstract = {Accurately modeling cellular response to perturbations is a central goal of computational biology. While such modeling has been proposed based on statistical, mechanistic and machine learning models in specific settings, no generalization of predictions to phenomena absent from training data i.e. {\textquoteleft}out-of-sample{\textquoteright} have yet been demonstrated. Here, we present scGen, a model combining variational autoencoders and latent space vector arithmetics for high-dimensional single-cell gene expression data. In benchmarks across a broad range of examples, we show that scGen accurately models dose and infection response of cells across cell types, studies and species. In particular, we demonstrate that scGen learns cell type and species specific response implying that it captures features that distinguish responding from non-responding genes and cells. With the upcoming availability of large-scale atlases of organs in healthy state, we envision scGen to become a tool for experimental design through in silico screening of perturbation response in the context of disease and drug treatment.},
added-at = {2019-06-19T00:25:00.000+0200},
author = {Lotfollahi, M. and Wolf, F. Alexander and Theis, Fabian J.},
biburl = {https://www.bibsonomy.org/bibtex/21efc8e94312ecf7a8b19122b398904bf/becker},
description = {Generative modeling and latent space arithmetics predict single-cell perturbation response across cell types, studies and species | bioRxiv},
doi = {10.1101/478503},
elocation-id = {478503},
eprint = {https://www.biorxiv.org/content/early/2018/11/29/478503.full.pdf},
interhash = {8642ec1b78dcd91c23010f0051cdf1e5},
intrahash = {1efc8e94312ecf7a8b19122b398904bf},
journal = {bioRxiv},
keywords = {afcs bayesian cell cvae gan generative model response single vae},
publisher = {Cold Spring Harbor Laboratory},
timestamp = {2019-06-24T06:44:49.000+0200},
title = {Generative modeling and latent space arithmetics predict single-cell perturbation response across cell types, studies and species},
url = {https://www.biorxiv.org/content/early/2018/11/29/478503},
year = 2018
}