@article {114, title = {A structural variation reference for medical and population genetics.}, journal = {Nature}, volume = {581}, year = {2020}, month = {2020 05}, pages = {444-451}, abstract = {

Structural variants (SVs) rearrange large segments of DNA and can have profound consequences in evolution and human disease. As national biobanks, disease-association studies, and clinical genetic testing have grown increasingly reliant on genome sequencing, population references such as the Genome Aggregation Database (gnomAD) have become integral in the interpretation of single-nucleotide variants (SNVs). However, there are no reference maps of SVs from high-coverage genome sequencing comparable to those for SNVs. Here we present a reference of sequence-resolved SVs constructed from 14,891 genomes across diverse global populations (54\% non-European) in gnomAD. We discovered a rich and complex landscape of 433,371 SVs, from which we estimate that SVs are responsible for 25-29\% of all rare protein-truncating events per genome. We found strong correlations between natural selection against damaging SNVs and rare SVs that disrupt or duplicate protein-coding sequence, which suggests that genes that are highly intolerant to loss-of-function are also sensitive to increased dosage. We also uncovered modest selection against noncoding SVs in cis-regulatory elements, although selection against protein-truncating SVs was stronger than all noncoding effects. Finally, we identified very large (over one megabase), rare SVs in 3.9\% of samples, and estimate that 0.13\% of individuals may carry an SV that meets the existing criteria for clinically important incidental findings. This SV resource is freely distributed via the gnomAD browser and will have broad utility in population genetics, disease-association studies, and diagnostic screening.

}, keywords = {Continental Population Groups, Disease, Female, Genetic Testing, Genetic Variation, Genetics, Medical, Genetics, Population, Genome, Human, Genotyping Techniques, Humans, Male, Middle Aged, Mutation, Polymorphism, Single Nucleotide, Reference Standards, Selection, Genetic, Whole Genome Sequencing}, issn = {1476-4687}, doi = {10.1038/s41586-020-2287-8}, author = {Collins, Ryan L and Brand, Harrison and Karczewski, Konrad J and Zhao, Xuefang and Alf{\"o}ldi, Jessica and Francioli, Laurent C and Khera, Amit V and Lowther, Chelsea and Gauthier, Laura D and Wang, Harold and Watts, Nicholas A and Solomonson, Matthew and O{\textquoteright}Donnell-Luria, Anne and Baumann, Alexander and Munshi, Ruchi and Walker, Mark and Whelan, Christopher W and Huang, Yongqing and Brookings, Ted and Sharpe, Ted and Stone, Matthew R and Valkanas, Elise and Fu, Jack and Tiao, Grace and Laricchia, Kristen M and Ruano-Rubio, Valentin and Stevens, Christine and Gupta, Namrata and Cusick, Caroline and Margolin, Lauren and Taylor, Kent D and Lin, Henry J and Rich, Stephen S and Post, Wendy S and Chen, Yii-Der Ida and Rotter, Jerome I and Nusbaum, Chad and Philippakis, Anthony and Lander, Eric and Gabriel, Stacey and Neale, Benjamin M and Kathiresan, Sekar and Daly, Mark J and Banks, Eric and MacArthur, Daniel G and Talkowski, Michael E} }