@article {112, title = {Major Impacts of Widespread Structural Variation on Gene Expression and Crop Improvement in Tomato.}, journal = {Cell}, volume = {182}, year = {2020}, month = {2020 07 09}, pages = {145-161.e23}, abstract = {

Structural variants (SVs) underlie important crop improvement and domestication traits. However, resolving the extent, diversity, and quantitative impact of SVs has been challenging. We used long-read nanopore sequencing to capture 238,490 SVs in 100 diverse tomato lines. This panSV genome, along with 14 new reference assemblies, revealed large-scale intermixing of diverse genotypes, as well as thousands of SVs intersecting genes and cis-regulatory regions. Hundreds of SV-gene pairs exhibit subtle and significant expression changes, which could broadly influence quantitative trait variation. By combining quantitative genetics with genome editing, we show how multiple SVs that changed gene dosage and expression levels modified fruit flavor, size, and production. In the last example, higher order epistasis among four SVs affecting three related transcription factors allowed introduction of an important harvesting trait in modern tomato. Our findings highlight the underexplored role of SVs in genotype-to-phenotype relationships and their widespread importance and utility in crop improvement.

}, keywords = {Alleles, Crops, Agricultural, Cytochrome P-450 Enzyme System, Ecotype, Epistasis, Genetic, Fruit, Gene Duplication, Gene Expression Regulation, Plant, Genome, Plant, Genomic Structural Variation, Genotype, Inbreeding, Lycopersicon esculentum, Molecular Sequence Annotation, Phenotype, Plant Breeding, Quantitative Trait Loci}, issn = {1097-4172}, doi = {10.1016/j.cell.2020.05.021}, author = {Alonge, Michael and Wang, Xingang and Benoit, Matthias and Soyk, Sebastian and Pereira, Lara and Zhang, Lei and Suresh, Hamsini and Ramakrishnan, Srividya and Maumus, Florian and Ciren, Danielle and Levy, Yuval and Harel, Tom Hai and Shalev-Schlosser, Gili and Amsellem, Ziva and Razifard, Hamid and Caicedo, Ana L and Tieman, Denise M and Klee, Harry and Kirsche, Melanie and Aganezov, Sergey and Ranallo-Benavidez, T Rhyker and Lemmon, Zachary H and Kim, Jennifer and Robitaille, Gina and Kramer, Melissa and Goodwin, Sara and McCombie, W Richard and Hutton, Samuel and Van Eck, Joyce and Gillis, Jesse and Eshed, Yuval and Sedlazeck, Fritz J and van der Knaap, Esther and Schatz, Michael C and Lippman, Zachary B} } @article {122, title = {Mapping and characterization of structural variation in 17,795 human genomes.}, journal = {Nature}, volume = {583}, year = {2020}, month = {2020 07}, pages = {83-89}, abstract = {

A key goal of whole-genome sequencing for studies of human genetics is to interrogate all forms of variation, including single-nucleotide variants, small insertion or deletion (indel) variants and structural variants. However, tools and resources for the study of structural variants have lagged behind those for smaller variants. Here we used a scalable pipeline to map and characterize structural variants in 17,795 deeply sequenced human genomes. We publicly release site-frequency data to create the largest, to our knowledge, whole-genome-sequencing-based structural variant resource so far. On average, individuals carry 2.9 rare structural variants that alter coding regions; these variants affect the dosage or structure of 4.2 genes and account for 4.0-11.2\% of rare high-impact coding alleles. Using a computational model, we estimate that structural variants account for 17.2\% of rare alleles genome-wide, with predicted deleterious effects that are equivalent to loss-of-function coding alleles; approximately 90\% of such structural variants are noncoding deletions (mean 19.1 per genome). We report 158,991 ultra-rare structural variants and show that 2\% of individuals carry ultra-rare megabase-scale structural variants, nearly half of which are balanced or complex rearrangements. Finally, we infer the dosage sensitivity of genes and noncoding elements, and reveal trends that relate to element class and conservation. This work will help to guide the analysis and interpretation of structural variants in the era of whole-genome sequencing.

}, keywords = {Alleles, Case-Control Studies, Continental Population Groups, Epigenesis, Genetic, Female, Gene Dosage, Genetic Variation, Genetics, Population, Genome, Human, High-Throughput Nucleotide Sequencing, Humans, Male, Molecular Sequence Annotation, Quantitative Trait Loci, Software, Whole Genome Sequencing}, issn = {1476-4687}, doi = {10.1038/s41586-020-2371-0}, author = {Abel, Haley J and Larson, David E and Regier, Allison A and Chiang, Colby and Das, Indraniel and Kanchi, Krishna L and Layer, Ryan M and Neale, Benjamin M and Salerno, William J and Reeves, Catherine and Buyske, Steven and Matise, Tara C and Muzny, Donna M and Zody, Michael C and Lander, Eric S and Dutcher, Susan K and Stitziel, Nathan O and Hall, Ira M} } @article {131, title = {A missense variant in Mitochondrial Amidoxime Reducing Component 1 gene and protection against liver disease.}, journal = {PLoS Genet}, volume = {16}, year = {2020}, month = {2020 04}, pages = {e1008629}, abstract = {

Analyzing 12,361 all-cause cirrhosis cases and 790,095 controls from eight cohorts, we identify a common missense variant in the Mitochondrial Amidoxime Reducing Component 1 gene (MARC1 p.A165T) that associates with protection from all-cause cirrhosis (OR 0.91, p = 2.3*10-11). This same variant also associates with lower levels of hepatic fat on computed tomographic imaging and lower odds of physician-diagnosed fatty liver as well as lower blood levels of alanine transaminase (-0.025 SD, 3.7*10-43), alkaline phosphatase (-0.025 SD, 1.2*10-37), total cholesterol (-0.030 SD, p = 1.9*10-36) and LDL cholesterol (-0.027 SD, p = 5.1*10-30) levels. We identified a series of additional MARC1 alleles (low-frequency missense p.M187K and rare protein-truncating p.R200Ter) that also associated with lower cholesterol levels, liver enzyme levels and reduced risk of cirrhosis (0 cirrhosis cases for 238 R200Ter carriers versus 17,046 cases of cirrhosis among 759,027 non-carriers, p = 0.04) suggesting that deficiency of the MARC1 enzyme may lower blood cholesterol levels and protect against cirrhosis.

}, keywords = {Alleles, Cholesterol, LDL, Coronary Artery Disease, Datasets as Topic, Fatty Liver, Female, Genetic Predisposition to Disease, Homozygote, Humans, Liver, Liver Cirrhosis, Liver Cirrhosis, Alcoholic, Loss of Function Mutation, Male, Middle Aged, Mitochondrial Proteins, Mutation, Missense, Oxidoreductases}, issn = {1553-7404}, doi = {10.1371/journal.pgen.1008629}, author = {Emdin, Connor A and Haas, Mary E and Khera, Amit V and Aragam, Krishna and Chaffin, Mark and Klarin, Derek and Hindy, George and Jiang, Lan and Wei, Wei-Qi and Feng, Qiping and Karjalainen, Juha and Havulinna, Aki and Kiiskinen, Tuomo and Bick, Alexander and Ardissino, Diego and Wilson, James G and Schunkert, Heribert and McPherson, Ruth and Watkins, Hugh and Elosua, Roberto and Bown, Matthew J and Samani, Nilesh J and Baber, Usman and Erdmann, Jeanette and Gupta, Namrata and Danesh, John and Saleheen, Danish and Chang, Kyong-Mi and Vujkovic, Marijana and Voight, Ben and Damrauer, Scott and Lynch, Julie and Kaplan, David and Serper, Marina and Tsao, Philip and Mercader, Josep and Hanis, Craig and Daly, Mark and Denny, Joshua and Gabriel, Stacey and Kathiresan, Sekar} } @article {68, title = {Mendelian Gene Discovery: Fast and Furious with No End in Sight.}, journal = {Am J Hum Genet}, volume = {105}, year = {2019}, month = {2019 Sep 05}, pages = {448-455}, abstract = {

Gene discovery for Mendelian conditions (MCs) offers a direct path to understanding genome function. Approaches based on next-generation sequencing applied at scale have dramatically accelerated gene discovery and transformed genetic medicine. Finding the genetic basis of \~{}6,000-13,000 MCs yet to be delineated will require both technical and computational innovation, but will rely to a larger extent on meaningful data sharing.

}, issn = {1537-6605}, doi = {10.1016/j.ajhg.2019.07.011}, author = {Bamshad, Michael J and Nickerson, Deborah A and Chong, Jessica X} } @article {59, title = {Monogenic causes of chronic kidney disease in adults.}, journal = {Kidney Int}, volume = {95}, year = {2019}, month = {2019 Apr}, pages = {914-928}, abstract = {

Approximately 500 monogenic causes of chronic kidney disease (CKD) have been identified, mainly in pediatric populations. The frequency of monogenic causes among adults with CKD has been less extensively studied. To determine the likelihood of detecting monogenic causes of CKD in adults presenting to nephrology services in Ireland, we conducted whole exome sequencing (WES) in a multi-centre cohort of 114 families including 138 affected individuals with CKD. Affected adults were recruited from 78 families with a positive family history, 16 families with extra-renal features, and 20 families with neither a family history nor extra-renal features. We detected a pathogenic mutation in a known CKD gene in 42 of 114 families (37\%). A monogenic cause was identified in 36\% of affected families with a positive family history of CKD, 69\% of those with extra-renal features, and only 15\% of those without a family history or extra-renal features. There was no difference in the rate of genetic diagnosis in individuals with childhood versus adult onset CKD. Among the 42 families in whom a monogenic cause was identified, WES confirmed the clinical diagnosis in 17 (40\%), corrected the clinical diagnosis in 9 (22\%), and established a diagnosis for the first time in 16 families referred with CKD of unknown etiology (38\%). In this multi-centre study of adults with CKD, a molecular genetic diagnosis was established in over one-third of families. In the evolving era of precision medicine, WES may be an important tool to identify the cause of CKD in adults.

}, issn = {1523-1755}, doi = {10.1016/j.kint.2018.10.031}, author = {Connaughton, Dervla M and Kennedy, Claire and Shril, Shirlee and Mann, Nina and Murray, Susan L and Williams, Patrick A and Conlon, Eoin and Nakayama, Makiko and van der Ven, Amelie T and Ityel, Hadas and Kause, Franziska and Kolvenbach, Caroline M and Dai, Rufeng and Vivante, Asaf and Braun, Daniela A and Schneider, Ronen and Kitzler, Thomas M and Moloney, Brona and Moran, Conor P and Smyth, John S and Kennedy, Alan and Benson, Katherine and Stapleton, Caragh and Denton, Mark and Magee, Colm and O{\textquoteright}Seaghdha, Conall M and Plant, William D and Griffin, Matthew D and Awan, Atif and Sweeney, Clodagh and Mane, Shrikant M and Lifton, Richard P and Griffin, Brenda and Leavey, Sean and Casserly, Liam and de Freitas, Declan G and Holian, John and Dorman, Anthony and Doyle, Brendan and Lavin, Peter J and Little, Mark A and Conlon, Peter J and Hildebrandt, Friedhelm} } @article {71, title = {MSTO1 mutations cause mtDNA depletion, manifesting as muscular dystrophy with cerebellar involvement.}, journal = {Acta Neuropathol}, year = {2019}, month = {2019 Aug 29}, abstract = {

MSTO1 encodes a cytosolic mitochondrial fusion protein, misato homolog 1 or MSTO1. While the full genotype-phenotype spectrum remains to be explored, pathogenic variants in MSTO1 have recently been reported in a small number of patients presenting with a phenotype of cerebellar ataxia, congenital muscle involvement with histologic findings ranging from myopathic to dystrophic and pigmentary retinopathy. The proposed underlying pathogenic mechanism of MSTO1-related disease is suggestive of impaired mitochondrial fusion secondary to a loss of function of MSTO1. Disorders of mitochondrial fusion and fission have been shown to also lead to mitochondrial DNA (mtDNA) depletion, linking them to the mtDNA depletion syndromes, a clinically and genetically diverse class of mitochondrial diseases characterized by a reduction of cellular mtDNA content. However, the consequences of pathogenic variants in MSTO1 on mtDNA maintenance remain poorly understood. We present extensive phenotypic and genetic data from 12 independent families, including 15 new patients harbouring a broad array of bi-allelic MSTO1 pathogenic variants, and we provide functional characterization from seven MSTO1-related disease patient fibroblasts. Bi-allelic loss-of-function variants in MSTO1 manifest clinically with a remarkably consistent phenotype of childhood-onset muscular dystrophy, corticospinal tract dysfunction and early-onset non-progressive cerebellar atrophy. MSTO1 protein was not detectable in the cultured fibroblasts of all seven patients evaluated, suggesting that pathogenic variants result in a loss of protein expression and/or affect protein stability. Consistent with impaired mitochondrial fusion, mitochondrial networks in fibroblasts were found to be fragmented. Furthermore, all fibroblasts were found to have depletion of mtDNA ranging from 30 to 70\% along with alterations to mtDNA nucleoids. Our data corroborate the role of MSTO1 as a mitochondrial fusion protein and highlight a previously unrecognized link to mtDNA regulation. As impaired mitochondrial fusion is a recognized cause of mtDNA depletion syndromes, this novel link to mtDNA depletion in patient fibroblasts suggests that MSTO1-deficiency should also be considered a mtDNA depletion syndrome. Thus, we provide mechanistic insight into the disease pathogenesis associated with MSTO1 mutations and further define the clinical spectrum and the natural history of MSTO1-related disease.

}, issn = {1432-0533}, doi = {10.1007/s00401-019-02059-z}, author = {Donkervoort, S and Sabouny, R and Yun, P and Gauquelin, L and Chao, K R and Hu, Y and Al Khatib, I and T{\"o}pf, A and Mohassel, P and Cummings, B B and Kaur, R and Saade, D and Moore, S A and Waddell, L B and Farrar, M A and Goodrich, J K and Uapinyoying, P and Chan, S H S and Javed, A and Leach, M E and Karachunski, P and Dalton, J and Medne, L and Harper, A and Thompson, C and Thiffault, I and Specht, S and Lamont, R E and Saunders, C and Racher, H and Bernier, F P and Mowat, D and Witting, N and Vissing, J and Hanson, R and Coffman, K A and Hainlen, M and Parboosingh, J S and Carnevale, A and Yoon, G and Schnur, R E and Boycott, K M and Mah, J K and Straub, V and Foley, A Reghan and Innes, A M and B{\"o}nnemann, C G and Shutt, T E} } @article {52, title = {A multi-task convolutional deep neural network for variant calling in single molecule sequencing.}, journal = {Nat Commun}, volume = {10}, year = {2019}, month = {2019 03 01}, pages = {998}, abstract = {

The accurate identification of DNA sequence variants is an important, but challenging task in genomics. It is particularly difficult for single molecule sequencing, which has a per-nucleotide error rate of ~5-15\%. Meeting this demand, we developed Clairvoyante, a multi-task five-layer convolutional neural network model for predicting variant type (SNP or indel), zygosity, alternative allele and indel length from aligned reads. For the well-characterized NA12878 human sample, Clairvoyante achieves 99.67, 95.78, 90.53\% F1-score on 1KP common variants, and 98.65, 92.57, 87.26\% F1-score for whole-genome analysis, using Illumina, PacBio, and Oxford Nanopore data, respectively. Training on a second human sample shows Clairvoyante is sample agnostic and finds variants in less than 2 h on a standard server. Furthermore, we present 3,135 variants that are missed using Illumina but supported independently by both PacBio and Oxford Nanopore reads. Clairvoyante is available open-source ( https://github.com/aquaskyline/Clairvoyante ), with modules to train, utilize and visualize the model.

}, keywords = {Base Sequence, Computational Biology, DNA Mutational Analysis, Genome, Human, Genome-Wide Association Study, Genomics, Genotype, Genotyping Techniques, Humans, INDEL Mutation, Nanopores, Neural Networks (Computer), Polymorphism, Single Nucleotide, Sequence Analysis, DNA, Software}, issn = {2041-1723}, doi = {10.1038/s41467-019-09025-z}, author = {Luo, Ruibang and Sedlazeck, Fritz J and Lam, Tak-Wah and Schatz, Michael C} } @article {46, title = {Modified penetrance of coding variants by cis-regulatory variation contributes to disease risk.}, journal = {Nat Genet}, volume = {50}, year = {2018}, month = {2018 Sep}, pages = {1327-1334}, abstract = {

Coding variants represent many of the strongest associations between genotype and phenotype; however, they exhibit inter-individual differences in effect, termed {\textquoteright}variable penetrance{\textquoteright}. Here, we study how cis-regulatory variation modifies the penetrance of coding variants. Using functional genomic and genetic data from the Genotype-Tissue Expression Project (GTEx), we observed that in the general population, purifying selection has depleted haplotype combinations predicted to increase pathogenic coding variant penetrance. Conversely, in cancer and autism patients, we observed an enrichment of penetrance increasing haplotype configurations for pathogenic variants in disease-implicated genes, providing evidence that regulatory haplotype configuration of coding variants affects disease risk. Finally, we experimentally validated this model by editing a Mendelian single-nucleotide polymorphism (SNP) using CRISPR/Cas9 on distinct expression haplotypes with the transcriptome as a phenotypic readout. Our results demonstrate that joint regulatory and coding variant effects are an important part of the genetic architecture of human traits and contribute to modified penetrance of disease-causing variants.

}, issn = {1546-1718}, doi = {10.1038/s41588-018-0192-y}, author = {Castel, Stephane E and Cervera, Alejandra and Mohammadi, Pejman and Aguet, Fran{\c c}ois and Reverter, Ferran and Wolman, Aaron and Guigo, Roderic and Iossifov, Ivan and Vasileva, Ana and Lappalainen, Tuuli} }