@article {124, title = {Chromosome-scale, haplotype-resolved assembly of human genomes.}, journal = {Nat Biotechnol}, volume = {39}, year = {2021}, month = {2021 03}, pages = {309-312}, abstract = {

Haplotype-resolved or phased genome assembly provides a complete picture of genomes and their complex genetic variations. However, current algorithms for phased assembly either do not generate chromosome-scale phasing or require pedigree information, which limits their application. We present a method named diploid assembly (DipAsm) that uses long, accurate reads and long-range conformation data for single individuals to generate a chromosome-scale phased assembly within 1 day. Applied to four public human genomes, PGP1, HG002, NA12878 and HG00733, DipAsm produced haplotype-resolved assemblies with minimum contig length needed to cover 50\% of the known genome (NG50) up to 25 Mb and phased ~99.5\% of heterozygous sites at 98-99\% accuracy, outperforming other approaches in terms of both contiguity and phasing completeness. We demonstrate the importance of chromosome-scale phased assemblies for the discovery of structural variants (SVs), including thousands of new transposon insertions, and of highly polymorphic and medically important regions such as the human leukocyte antigen (HLA) and killer cell immunoglobulin-like receptor (KIR) regions. DipAsm will facilitate high-quality precision medicine and studies of individual haplotype variation and population diversity.

}, keywords = {Algorithms, Chromosomes, Human, Genome, Human, Haplotypes, Heterozygote, Humans, Polymorphism, Single Nucleotide}, issn = {1546-1696}, doi = {10.1038/s41587-020-0711-0}, author = {Garg, Shilpa and Fungtammasan, Arkarachai and Carroll, Andrew and Chou, Mike and Schmitt, Anthony and Zhou, Xiang and Mac, Stephen and Peluso, Paul and Hatas, Emily and Ghurye, Jay and Maguire, Jared and Mahmoud, Medhat and Cheng, Haoyu and Heller, David and Zook, Justin M and Moemke, Tobias and Marschall, Tobias and Sedlazeck, Fritz J and Aach, John and Chin, Chen-Shan and Church, George M and Li, Heng} } @article {78, title = {Accurate circular consensus long-read sequencing improves variant detection and assembly of a human genome.}, journal = {Nat Biotechnol}, volume = {37}, year = {2019}, month = {2019 Oct}, pages = {1155-1162}, abstract = {

The DNA sequencing technologies in use today produce either highly accurate short reads or less-accurate long reads. We report the optimization of circular consensus sequencing (CCS) to improve the accuracy of single-molecule real-time (SMRT) sequencing (PacBio) and generate highly accurate (99.8\%) long high-fidelity (HiFi) reads with an average length of 13.5 kilobases (kb). We applied our approach to sequence the well-characterized human HG002/NA24385 genome and obtained precision and recall rates of at least 99.91\% for single-nucleotide variants (SNVs), 95.98\% for insertions and deletions <50 bp (indels) and 95.99\% for structural variants. Our CCS method matches or exceeds the ability of short-read sequencing to detect small variants and structural variants. We estimate that 2,434 discordances are correctable mistakes in the {\textquoteright}genome in a bottle{\textquoteright} (GIAB) benchmark set. Nearly all (99.64\%) variants can be phased into haplotypes, further improving variant detection. De novo genome assembly using CCS reads alone produced a contiguous and accurate genome with a contig N50 of >15 megabases (Mb) and concordance of 99.997\%, substantially outperforming assembly with less-accurate long reads.

}, issn = {1546-1696}, doi = {10.1038/s41587-019-0217-9}, author = {Wenger, Aaron M and Peluso, Paul and Rowell, William J and Chang, Pi-Chuan and Hall, Richard J and Concepcion, Gregory T and Ebler, Jana and Fungtammasan, Arkarachai and Kolesnikov, Alexey and Olson, Nathan D and T{\"o}pfer, Armin and Alonge, Michael and Mahmoud, Medhat and Qian, Yufeng and Chin, Chen-Shan and Phillippy, Adam M and Schatz, Michael C and Myers, Gene and DePristo, Mark A and Ruan, Jue and Marschall, Tobias and Sedlazeck, Fritz J and Zook, Justin M and Li, Heng and Koren, Sergey and Carroll, Andrew and Rank, David R and Hunkapiller, Michael W} }