@article {Boyrie2020.02.14.949206, author = {L{\'e}a Boyrie and Corentin Moreau and Florian Frugier and Christophe Jacquet and Maxime Bonhomme}, title = {A fast linkage disequilibrium-based statistical test for Genome-Wide Epistatic Selection Scans in structured populations}, elocation-id = {2020.02.14.949206}, year = {2020}, doi = {10.1101/2020.02.14.949206}, publisher = {Cold Spring Harbor Laboratory}, abstract = {The quest for genome-wide signatures of selection in populations using SNP data has proven efficient to uncover genes involved in conserved or adaptive molecular functions, but none of the statistical methods were designed to identify interacting genes as targets of selective processes. Here, we propose a straightforward statistical test aimed at detecting epistatic selection, based on a linkage disequilibrium (LD) measure accounting for population structure and heterogeneous relatedness between individuals. SNP-based (Trv) and window-based (TcorPC1v) statistics fit a Student distribution, allowing to easily and quickly test the significance of correlation coefficients in the frame of Genome-Wide Epistatic Selection Scans (GWESS) using candidate genes as baits. As a proof of concept, use of SNP data from the Medicago truncatula symbiotic legume plant uncovered a previously unknown gene coadaptation between the MtSUNN (Super Numeric Nodule) receptor and the MtCLE02 (CLAVATA3-Like) signalling peptide, and experimental evidence accordingly supported a MtSUNN-dependent negative role of MtCLE02 in symbiotic root nodulation. Using human HGDP-CEPH SNP data, our new statistical test uncovered strong LD between SLC24A5 and EDAR worldwide, which persists after correction for population structure and relatedness in Central South Asian populations. This result suggests adaptive genetic interaction or coselection between skin pigmentation and the ectodysplasin pathway involved in the development of ectodermal organs (hairs, teeth, sweat glands), in some human populations. Applying this approach to genome-wide SNP data will foster the identification of evolutionary coadapted gene networks.Author summary Population genomic methods have allowed to identify many genes associated with adaptive processes in populations with complex histories. However, they are not designed to identify gene coadaptation between genes through epistatic selection, in structured populations. To tackle this problem, we developed a straightforward LD-based statistical test accounting for population structure and heterogeneous relatedness between individuals, using SNP-based (Trv) or windows-based (TcorPC1v) statistics. This allows easily and quickly testing for significance of correlation coefficients between polymorphic loci in the frame of Genome Wide Epistatic Selection Scans (GWESS). Following detection of gene coadaptation using SNP data from human and the model plant Medicago truncatula, we report experimental evidence of genetic interaction between two receptors involved in the regulation of root nodule symbiosis in Medicago truncatula. This test opens new avenues for exploring the evolution of genes as interacting units and thus paves the way to infer new networks based on evolutionary coadaptation between genes.}, URL = {https://www.biorxiv.org/content/early/2020/02/14/2020.02.14.949206}, eprint = {https://www.biorxiv.org/content/early/2020/02/14/2020.02.14.949206.full.pdf}, journal = {bioRxiv} }