% Yang et al. (2019): bioRxiv preprint describing a phased, chromosome-scale
% genome assembly of a male Luchuan pig.
% `eprint` carries the bare bioRxiv identifier (same number as the DOI suffix
% and elocation-id); the landing page is in `url`. The full-text PDF is at:
%   https://www.biorxiv.org/content/early/2019/09/16/770958.full.pdf
@article{Yang770958,
  author        = {Yang, Yalan and
                   Lian, Jinmin and
                   Xie, Bingkun and
                   Chen, Muya and
                   Niu, Yongchao and
                   Li, Qiaowei and
                   Liu, Yuwen and
                   Yi, Guoqiang and
                   Fan, Xinhao and
                   Tang, Yijie and
                   Li, Jiang and
                   Liachko, Ivan and
                   Sullivan, Shawn T. and
                   Nelson, Bradley and
                   Zuo, Erwei and
                   Tang, Zhonglin},
  title         = {Chromosome-scale de novo assembly and phasing of a {Chinese} indigenous pig genome},
  journal       = {bioRxiv},
  publisher     = {Cold Spring Harbor Laboratory},
  year          = {2019},
  elocation-id  = {770958},
  doi           = {10.1101/770958},
  eprint        = {770958},
  eprinttype    = {bioRxiv},
  url           = {https://www.biorxiv.org/content/early/2019/09/16/770958},
  abstract      = {Chinese indigenous pigs differ significantly from Western commercial pig breeds in phenotypic and genomic characteristics. Thus, building a high-quality reference genome for Chinese indigenous pigs is pivotal to exploring gene function, genome evolution and improving genetic breeding in pigs. Here, we report an ultrahigh-quality phased chromosome-scale genome assembly for a male Luchuan pig, a representative Chinese domestic breed, by generating and combining data from PacBio Sequel reads, Illumina paired-end reads, high-throughput chromatin conformation capture and BioNano optical map. The primary assembly is $\sim$2.58 Gb in size with contig and scaffold N50s of 18.03 Mb and 140.09 Mb, respectively. Comparison between primary assembly and alternative haplotig reveals numerous haplotype-specific alleles, which provide a rich resource to study the allele-specific expression, epigenetic regulation, genome structure and evolution of pigs. Gene enrichment analysis indicates that the Luchuan-specific genes are predominantly enriched in Gene Ontology terms for phosphoprotein phosphatase activity, signaling receptor activity and phosphatidylinositol binding. We provide clear molecular evolutionary evidence that the divergence time between Luchuan and Duroc pigs is dated back to about 1.7 million years ago. Meanwhile, Luchuan exhibits fewer events of gene family expansion and stronger gene family contraction than Duroc. The positively selected genes (PSGs) in Luchuan pig significantly enrich for protein tyrosine kinase activity, microtubule motor activity, GTPase activator activity and ubiquitin-protein transferase activity, whereas the PSGs in Duroc pig enrich for G-protein coupled receptor activity. Overall, our findings not only provide key benchmark data for the pig genetics community, but also pave a new avenue for utilizing porcine biomedical models to study human health and diseases.},
}