Repetitive sequences make up a significant fraction of almost any genome, and an important and still open question in bioinformatics is how to represent all repeats in DNA sequences. We propose a new approach to repeat classification that represents all repeats in a genome as a mosaic of sub-repeats. Our key algorithmic idea also leads to new approaches to multiple alignment and fragment assembly. In particular, we show that our FragmentGluer assembler improves on Phrap and ARACHNE in assembly of BACs and bacterial genomes.
%0 Journal Article
%1 Pevzner:2004aa
%A Pevzner, Pavel A
%A Pevzner, Paul A
%A Tang, Haixu
%A Tesler, Glenn
%D 2004
%J Genome Res
%K (Genetics), Acid, Algorithms, Alignment, Analysis, Artificial, Bacterial, Biology, Chromosomes, Cluster Computational Contig Family Genome, Human, Humans, Linkage Mapping, Multigene Nucleic Repetitive Sequence Sequences,
%N 9
%P 1786--96
%R 10.1101/gr.2395204
%T De novo repeat classification and fragment assembly
%V 14
%X Repetitive sequences make up a significant fraction of almost any genome, and an important and still open question in bioinformatics is how to represent all repeats in DNA sequences. We propose a new approach to repeat classification that represents all repeats in a genome as a mosaic of sub-repeats. Our key algorithmic idea also leads to new approaches to multiple alignment and fragment assembly. In particular, we show that our FragmentGluer assembler improves on Phrap and ARACHNE in assembly of BACs and bacterial genomes.
@article{Pevzner:2004aa,
abstract = {Repetitive sequences make up a significant fraction of almost any genome, and an important and still open question in bioinformatics is how to represent all repeats in DNA sequences. We propose a new approach to repeat classification that represents all repeats in a genome as a mosaic of sub-repeats. Our key algorithmic idea also leads to new approaches to multiple alignment and fragment assembly. In particular, we show that our FragmentGluer assembler improves on Phrap and ARACHNE in assembly of BACs and bacterial genomes.},
added-at = {2007-09-17T20:19:41.000+0200},
affiliation = {Department of Computer Science and Engineering, University of California, San Diego, La Jolla, California 92093, USA.},
author = {Pevzner, Pavel A and Pevzner, Paul A and Tang, Haixu and Tesler, Glenn},
biburl = {https://www.bibsonomy.org/bibtex/251d90db8174d7d1da830b654951e5ea0/dzerbino},
doi = {10.1101/gr.2395204},
interhash = {181b5dccc85c51d1fe0009ae53cbed00},
intrahash = {51d90db8174d7d1da830b654951e5ea0},
issue = {9},
journal = {Genome Res},
keywords = {(Genetics), Acid, Algorithms, Alignment, Analysis, Artificial, Bacterial, Biology, Chromosomes, Cluster Computational Contig Family Genome, Human, Humans, Linkage Mapping, Multigene Nucleic Repetitive Sequence Sequences,},
language = {English},
local-url = {file://localhost/Users/danielzerbino/Documents/Papers/2004/Pevzner/Genome%20Res%202004%20Pevzner.pdf},
month = Sep,
number = 9,
pages = {1786--96},
pii = {14/9/1786},
pmid = {15342561},
timestamp = {2007-09-17T20:19:43.000+0200},
title = {De novo repeat classification and fragment assembly},
uri = {papers://055852FE-1648-42FE-91D0-8CA474D2B905/Paper/p26},
volume = 14,
year = 2004
}