@article {Lukassen740415, author = {Soeren Lukassen and Foo Wei Ten and Roland Eils and Christian Conrad}, title = {Gene set inference from single-cell sequencing data using a hybrid of matrix factorization and variational autoencoders}, elocation-id = {740415}, year = {2019}, doi = {10.1101/740415}, publisher = {Cold Spring Harbor Laboratory}, abstract = {Recent advances in single-cell RNA sequencing (scRNA-Seq) have driven the simultaneous measurement of the expression of 1,000s of genes in 1,000s of single cells. These growing data sets allow us to model gene sets in biological networks at an unprecedented level of detail, in spite of heterogenous cell populations. Here, we propose an unsupervised deep neural network model that is a hybrid of matrix factorization and conditional variational autoencoders (CVA), which utilizes weights as matrix factorizations to obtain gene sets, while class-specific inputs to the latent variable space facilitate a plausible identification of cell types. This artificial neural network model seamlessly integrates functional gene set inference, experimental batch effect correction, and static gene identification, which we conceptually prove here for three single-cell RNA-Seq datasets and suggest for future single-cell-gene analytics.}, URL = {https://www.biorxiv.org/content/early/2019/09/02/740415}, eprint = {https://www.biorxiv.org/content/early/2019/09/02/740415.full.pdf}, journal = {bioRxiv} }