% bioRxiv preprint record. The competing-interest statement and the direct PDF
% link are kept in fields that standard styles ignore (competing-interests, pdf-url).
@article{Sinai2021.04.16.440236,
  author              = {Sinai, Sam and Jain, Nina and Church, George M. and Kelsic, Eric D.},
  title               = {Generative {AAV} capsid diversification by latent interpolation},
  journal             = {bioRxiv},
  publisher           = {Cold Spring Harbor Laboratory},
  year                = {2021},
  elocation-id        = {2021.04.16.440236},
  doi                 = {10.1101/2021.04.16.440236},
  url                 = {https://www.biorxiv.org/content/early/2021/04/17/2021.04.16.440236},
  eprint              = {2021.04.16.440236},
  eprinttype          = {bioRxiv},
  pdf-url             = {https://www.biorxiv.org/content/early/2021/04/17/2021.04.16.440236.full.pdf},
  abstract            = {Adeno-associated virus (AAV) capsids have shown clinical promise as delivery vectors for gene therapy. However, the high prevalence of pre-existing immunity against natural capsids poses a challenge for widespread treatment. The generation of diverse capsids that are potentially more capable of immune evasion is challenging because introducing multiple mutations often breaks capsid assembly. Here we target a representative, immunologically relevant 28-amino-acid segment of the AAV2 capsid and show that a low-complexity Variational Auto-encoder (VAE) can interpolate in sequence space to produce diverse and novel capsids capable of packaging their own genomes. We first train the VAE on a 564-sample Multiple-Sequence Alignment (MSA) of dependo-parvoviruses, and then further augment this dataset by adding 22,704 samples from a deep mutational exploration (DME) on the target region. In both cases the VAE generated viable variants with many mutations, which we validated experimentally. We propose that this simple approach can be used to optimize and diversify other proteins, as well as other capsid traits of interest for gene delivery.},
  competing-interests = {EK, NJ, SS, GMC performed research while at Harvard University and EK, SS also performed research while at Dyno Therapeutics. EK, SS, and GMC hold equity at Dyno Therapeutics. A full list of GMC's tech transfer, advisory roles, and funding sources can be found on the lab's website: http://arep.med.harvard.edu/gmc/tech.html. Harvard University has filed a patent application for inventions related to this work.},
}