% bioRxiv preprint, doi 10.1101/041343 (Suppes-Bayes Causal Networks).
@article{Ramazzotti041343,
  author        = {Ramazzotti, Daniele and Graudenzi, Alex and Caravagna, Giulio and Antoniotti, Marco},
  title         = {Modeling cumulative biological phenomena with {Suppes-Bayes} Causal Networks},
  journal       = {bioRxiv},
  publisher     = {Cold Spring Harbor Laboratory},
  year          = {2017},
  elocation-id  = {041343},
  doi           = {10.1101/041343},
  url           = {https://www.biorxiv.org/content/early/2017/03/08/041343},
  eprint        = {https://www.biorxiv.org/content/early/2017/03/08/041343.full.pdf},
  abstract      = {Several diseases related to cell proliferation are characterized by
                   the accumulation of somatic DNA changes, with respect to wildtype
                   conditions. Cancer and HIV are two common examples of such diseases,
                   where the mutational load in the cancerous/viral population increases
                   over time. In these cases, selective pressures are often observed
                   along with competition, co-operation and parasitism among distinct
                   cellular clones. Recently, we presented a mathematical framework to
                   model these phenomena, based on a combination of Bayesian inference
                   and Suppes' theory of probabilistic causation, depicted in graphical
                   structures dubbed Suppes-Bayes Causal Networks (SBCNs). SBCNs are
                   generative probabilistic graphical models that recapitulate the
                   potential ordering of accumulation of such DNA changes during the
                   progression of the disease. Such models can be inferred from data by
                   exploiting likelihood-based model-selection strategies with
                   regularization. In this paper we discuss the theoretical foundations
                   of our approach and we investigate in depth the influence on the
                   model-selection task of: (i) the poset based on Suppes' theory and
                   (ii) different regularization strategies. Furthermore, we provide an
                   example of application of our framework to HIV genetic data
                   highlighting the valuable insights provided by the inferred SBCN.},
}