@article {49535, title = {Genomic analysis of sequence-dependent DNA curvature in Leishmania.}, volume = {8}, year = {2013}, month = {2013}, pages = {e63068}, abstract = {

Leishmania major is a flagellated protozoan parasite of medical importance. Like other members of the Trypanosomatidae family, it possesses unique mechanisms of gene expression such as constitutive polycistronic transcription of directional gene clusters, gene amplification, mRNA trans-splicing, and extensive editing of mitochondrial transcripts. The molecular signals underlying most of these processes remain under investigation. In order to investigate the role of DNA secondary structure signals in gene expression, we carried out a genome-wide in silico analysis of the intrinsic DNA curvature. The L. major genome revealed a lower frequency of high intrinsic curvature regions as well as inter- and intra- chromosomal distribution heterogeneity, when compared to prokaryotic and eukaryotic organisms. Using a novel method aimed at detecting region-integrated intrinsic curvature (RIIC), high DNA curvature was found to be associated with regions implicated in transcription initiation. Those include divergent strand-switch regions between directional gene clusters and regions linked to markers of active transcription initiation such as acetylated H3 histone, TRF4 and SNAP50. These findings suggest a role for DNA curvature in transcription initiation in Leishmania supporting the relevance of DNA secondary structures signals.

}, keywords = {Chromosome mapping, Comparative Genomic Hybridization, Computational Biology, DNA, Protozoan, Genome, Protozoan, Genomics, HUMANS, Leishmania, Nucleic Acid Conformation}, issn = {1932-6203}, doi = {10.1371/journal.pone.0063068}, author = {Smircich, Pablo and Forteza, Diego and El-Sayed, Najib M and Garat, Beatriz} } @article {49652, title = {The genome and its implications.}, journal = {Adv Parasitol}, volume = {75}, year = {2011}, month = {2011}, pages = {209-30}, abstract = {

Trypanosoma cruzi has a heterogeneous population composed of a pool of strains that circulate in the domestic and sylvatic cycles. Genome sequencing of the clone CL Brener revealed a highly repetitive genome of about 110Mb containing an estimated 22,570 genes. Because of its hybrid nature, sequences representing the two haplotypes have been generated. In addition, a repeat content close to 50\% made the assembly of the estimated 41 pairs of chromosomes quite challenging. Similar to other trypanosomatids, the organization of T. cruzi chromosomes was found to be very peculiar, with protein-coding genes organized in long polycistronic transcription units encoding 20 or more proteins in one strand separated by strand switch regions. Another remarkable feature of the T. cruzi genome is the massive expansion of surface protein gene families. Because of the high genetic diversity of the T. cruzi population, sequencing of additional strains and comparative genomic and transcriptome analyses are in progress. Five years after its publication, the genome data have proven to be an essential tool for the study of T. cruzi and increasing efforts to translate this knowledge into the development of new modes of intervention to control Chagas disease are underway.

}, keywords = {Animals, Antigens, Protozoan, Chagas Disease, Chromosomes, Comparative Genomic Hybridization, DNA, Protozoan, Gene Expression Regulation, Genetic Variation, Genome, Protozoan, Host-Parasite Interactions, HUMANS, Species Specificity, Synteny, Transcription, Genetic, Transfection, Trypanosoma cruzi}, issn = {0065-308X}, doi = {10.1016/B978-0-12-385863-4.00010-1}, author = {Teixeira, Santuza M and El-Sayed, Najib M and Ara{\'u}jo, Patr{\'\i}cia R} } @article {49639, title = {The Trypanosoma cruzi L1Tc and NARTc non-LTR retrotransposons show relative site specificity for insertion.}, journal = {Mol Biol Evol}, volume = {23}, year = {2006}, month = {2006 Feb}, pages = {411-20}, abstract = {

The trypanosomatid protozoan Trypanosoma cruzi contains long autonomous (L1Tc) and short nonautonomous (NARTc) non-long terminal repeat retrotransposons. NARTc (0.25 kb) probably derived from L1Tc (4.9 kb) by 3{\textquoteright}-deletion. It has been proposed that their apparent random distribution in the genome is related to the L1Tc-encoded apurinic/apyrimidinic endonuclease (APE) activity, which repairs modified residues. To address this question we used the T. cruzi (CL-Brener strain) genome data to analyze the distribution of all the L1Tc/NARTc elements present in contigs larger than 10 kb. This data set, which represents 0.91x sequence coverage of the haploid nuclear genome ( approximately 55 Mb), contains 419 elements, including 112 full-length L1Tc elements (14 of which are potentially functional) and 84 full-length NARTc. Approximately half of the full-length elements are flanked by a target site duplication, most of them (87\%) are 12 bp long. Statistical analyses of sequences flanking the full-length elements show the same highly conserved pattern upstream of both the L1Tc and NARTc retrotransposons. The two most conserved residues are a guanine and an adenine, which flank the site where first-strand cleavage is performed by the element-encoded endonuclease activity. This analysis clearly indicates that the L1Tc and NARTc elements display relative site specificity for insertion, which suggests that the APE activity is not responsible for first-strand cleavage of the target site.

}, keywords = {Animals, DNA, Protozoan, DNA-(Apurinic or Apyrimidinic Site) Lyase, Mutagenesis, Insertional, Retroelements, Sequence Deletion, Trypanosoma cruzi}, issn = {0737-4038}, doi = {10.1093/molbev/msj046}, author = {Bringaud, Frederic and Bartholomeu, Daniella C and Blandin, Ga{\"e}lle and Delcher, Arthur and Baltz, Th{\'e}o and el-Sayed, Najib M A and Ghedin, Elodie} } @article {49636, title = {Telomere and subtelomere of Trypanosoma cruzi chromosomes are enriched in (pseudo)genes of retrotransposon hot spot and trans-sialidase-like gene families: the origins of T. cruzi telomeres.}, journal = {Gene}, volume = {346}, year = {2005}, month = {2005 Feb 14}, pages = {153-61}, abstract = {

Here, we sequenced two large telomeric regions obtained from the pathogen protozoan Trypanosoma cruzi. These sequences, together with in silico assembled contigs, allowed us to establish the general features of telomeres and subtelomeres of this parasite. Our findings can be summarized as follows: We confirmed the presence of two types of telomeric ends; subtelomeric regions appeared to be enriched in (pseudo)genes of RHS (retrotransposon hot spot), TS (trans-sialidase)-like proteins, and putative surface protein DGF-1 (dispersed gene family-1). Sequence analysis of the ts-like genes located at the telomeres suggested that T. cruzi chromosomal ends could have been the site for generation of new gp85 variants, an important adhesin molecule involved in the invasion of mammalian cells by T. cruzi. Finally, a mechanism for generation of T. cruzi telomere by chromosome breakage and telomere healing is proposed.

}, keywords = {Amino Acid Sequence, Animals, Base Sequence, Chromosomes, Chromosomes, Artificial, Bacterial, DNA, Protozoan, Genes, Protozoan, Glycoproteins, Molecular Sequence Data, Multigene Family, Neuraminidase, Pseudogenes, Retroelements, Sequence Homology, Amino Acid, Sequence Homology, Nucleic Acid, Telomere, Trypanosoma cruzi}, issn = {0378-1119}, doi = {10.1016/j.gene.2004.10.014}, author = {Kim, Dong and Chiurillo, Miguel Angel and El-Sayed, Najib and Jones, Kristin and Santos, M{\'a}rcia R M and Porcile, Patricio E and Andersson, Bj{\"o}rn and Myler, Peter and da Silveira, Jose Franco and Ram{\'\i}rez, Jos{\'e} Luis} } @article {49633, title = {The sequence and analysis of Trypanosoma brucei chromosome II.}, journal = {Nucleic Acids Res}, volume = {31}, year = {2003}, month = {2003 Aug 15}, pages = {4856-63}, abstract = {

We report here the sequence of chromosome II from Trypanosoma brucei, the causative agent of African sleeping sickness. The 1.2-Mb pairs encode about 470 predicted genes organised in 17 directional clusters on either strand, the largest cluster of which has 92 genes lined up over a 284-kb region. An analysis of the GC skew reveals strand compositional asymmetries that coincide with the distribution of protein-coding genes, suggesting these asymmetries may be the result of transcription-coupled repair on coding versus non-coding strand. A 5-cM genetic map of the chromosome reveals recombinational {\textquoteright}hot{\textquoteright} and {\textquoteright}cold{\textquoteright} regions, the latter of which is predicted to include the putative centromere. One end of the chromosome consists of a 250-kb region almost exclusively composed of RHS (pseudo)genes that belong to a newly characterised multigene family containing a hot spot of insertion for retroelements. Interspersed with the RHS genes are a few copies of truncated RNA polymerase pseudogenes as well as expression site associated (pseudo)genes (ESAGs) 3 and 4, and 76 bp repeats. These features are reminiscent of a vestigial variant surface glycoprotein (VSG) gene expression site. The other end of the chromosome contains a 30-kb array of VSG genes, the majority of which are pseudogenes, suggesting that this region may be a site for modular de novo construction of VSG gene diversity during transposition/gene conversion events.

}, keywords = {Animals, Antigens, Protozoan, Chromosome mapping, Chromosomes, DNA, Protozoan, Gene Duplication, Genes, Protozoan, Molecular Sequence Data, Pseudogenes, Recombination, Genetic, Sequence Analysis, DNA, Trypanosoma brucei brucei}, issn = {1362-4962}, author = {el-Sayed, Najib M A and Ghedin, Elodie and Song, Jinming and MacLeod, Annette and Bringaud, Frederic and Larkin, Christopher and Wanless, David and Peterson, Jeremy and Hou, Lihua and Taylor, Sonya and Tweedie, Alison and Biteau, Nicolas and Khalak, Hanif G and Lin, Xiaoying and Mason, Tanya and Hannick, Linda and Caler, Elisabet and Blandin, Ga{\"e}lle and Bartholomeu, Daniella and Simpson, Anjana J and Kaul, Samir and Zhao, Hong and Pai, Grace and Van Aken, Susan and Utterback, Teresa and Haas, Brian and Koo, Hean L and Umayam, Lowell and Suh, Bernard and Gerrard, Caroline and Leech, Vanessa and Qi, Rong and Zhou, Shiguo and Schwartz, David and Feldblyum, Tamara and Salzberg, Steven and Tait, Andrew and Turner, C Michael R and Ullu, Elisabetta and White, Owen and Melville, Sara and Adams, Mark D and Fraser, Claire M and Donelson, John E} } @article {38304, title = {Genome sequence of the human malaria parasite Plasmodium falciparum}, journal = {NatureNature}, volume = {419}, year = {2002}, note = {http://www.ncbi.nlm.nih.gov/pubmed/12368864?dopt=Abstract}, type = {10.1038/nature01097}, abstract = {The parasite Plasmodium falciparum is responsible for hundreds of millions of cases of malaria, and kills more than one million African children annually. Here we report an analysis of the genome sequence of P. falciparum clone 3D7. The 23-megabase nuclear genome consists of 14 chromosomes, encodes about 5,300 genes, and is the most (A + T)-rich genome sequenced to date. Genes involved in antigenic variation are concentrated in the subtelomeric regions of the chromosomes. Compared to the genomes of free-living eukaryotic microbes, the genome of this intracellular parasite encodes fewer enzymes and transporters, but a large proportion of genes are devoted to immune evasion and host-parasite interactions. Many nuclear-encoded proteins are targeted to the apicoplast, an organelle involved in fatty-acid and isoprenoid metabolism. The genome sequence provides the foundation for future studies of this organism, and is being exploited in the search for new drugs and vaccines to fight malaria.}, keywords = {Animals, Chromosome Structures, DNA Repair, DNA Replication, DNA, Protozoan, Evolution, Molecular, Genome, Protozoan, HUMANS, Malaria Vaccines, Malaria, Falciparum, Membrane Transport Proteins, Molecular Sequence Data, Plasmodium falciparum, Plastids, Proteome, Protozoan Proteins, Recombination, Genetic, Sequence Analysis, DNA}, author = {Gardner, Malcolm J. and Hall, Neil and Fung, Eula and White, Owen and Berriman, Matthew and Hyman, Richard W. and Carlton, Jane M. and Pain, Arnab and Nelson, Karen E. and Bowman, Sharen and Paulsen, Ian T. and James, Keith and Eisen, Jonathan A. and Rutherford, Kim and Salzberg, Steven L. and Craig, Alister and Kyes, Sue and Chan, Man-Suen and Nene, Vishvanath and Shallom, Shamira J. and Suh, Bernard and Peterson, Jeremy and Angiuoli, Sam and Pertea, Mihaela and Allen, Jonathan and J. Selengut and Haft, Daniel and Mather, Michael W. and Vaidya, Akhil B. and Martin, David M. A. and Fairlamb, Alan H. and Fraunholz, Martin J. and Roos, David S. and Ralph, Stuart A. and McFadden, Geoffrey I. and Cummings, Leda M. and Subramanian, G. Mani and Mungall, Chris and Venter, J. Craig and Carucci, Daniel J. and Hoffman, Stephen L. and Newbold, Chris and Davis, Ronald W. and Fraser, Claire M. and Barrell, Bart} } @article {49631, title = {A new, expressed multigene family containing a hot spot for insertion of retroelements is associated with polymorphic subtelomeric regions of Trypanosoma brucei.}, journal = {Eukaryot Cell}, volume = {1}, year = {2002}, month = {2002 Feb}, pages = {137-51}, abstract = {

We describe a novel gene family that forms clusters in subtelomeric regions of Trypanosoma brucei chromosomes and partially accounts for the observed clustering of retrotransposons. The ingi and ribosomal inserted mobile element (RIME) non-LTR retrotransposons share 250 bp at both extremities and are the most abundant putatively mobile elements, with about 500 copies per haploid genome. From cDNA clones and subsequently in the T. brucei genomic DNA databases, we identified 52 homologous gene and pseudogene sequences, 16 of which contain a RIME and/or ingi retrotransposon inserted at exactly the same relative position. Here these genes are called the RHS family, for retrotransposon hot spot. Comparison of the protein sequences encoded by RHS genes (21 copies) and pseudogenes (24 copies) revealed a conserved central region containing an ATP/GTP-binding motif and the RIME/ingi insertion site. The RHS proteins share between 13 and 96\% identity, and six subfamilies, RHS1 to RHS6, can be defined on the basis of their divergent C-terminal domains. Immunofluorescence and Western blot analyses using RHS subfamily-specific immune sera show that RHS proteins are constitutively expressed and occur mainly in the nucleus. Analysis of Genome Survey Sequence databases indicated that the Trypanosoma brucei diploid genome contains about 280 RHS (pseudo)genes. Among the 52 identified RHS (pseudo)genes, 48 copies are in three RHS clusters located in subtelomeric regions of chromosomes Ia and II and adjacent to the active bloodstream form expression site in T. brucei strain TREU927/4 GUTat10.1. RHS genes comprise the remaining sequence of the size-polymorphic "repetitive region" described for T. brucei chromosome I, and a homologous gene family is present in the Trypanosoma cruzi genome.

}, keywords = {Amino Acid Sequence, Animals, Base Sequence, Cloning, Molecular, DNA Primers, DNA, Protozoan, Escherichia coli, Genes, Protozoan, Molecular Sequence Data, Multigene Family, Mutagenesis, Insertional, Phylogeny, Polymorphism, Genetic, Protozoan Proteins, Pseudogenes, Retroelements, sequence alignment, Sequence Homology, Amino Acid, Telomere, Trypanosoma brucei brucei, Trypanosoma cruzi}, issn = {1535-9778}, author = {Bringaud, Frederic and Biteau, Nicolas and Melville, Sara E and Hez, St{\'e}phanie and El-Sayed, Najib M and Leech, Vanessa and Berriman, Matthew and Hall, Neil and Donelson, John E and Baltz, Th{\'e}o} } @article {38492, title = {Sequence of Plasmodium falciparum chromosomes 2, 10, 11 and 14}, journal = {NatureNature}, volume = {419}, year = {2002}, note = {http://www.ncbi.nlm.nih.gov/pubmed/12368868?dopt=Abstract}, type = {10.1038/nature01094}, abstract = {The mosquito-borne malaria parasite Plasmodium falciparum kills an estimated 0.7-2.7 million people every year, primarily children in sub-Saharan Africa. Without effective interventions, a variety of factors-including the spread of parasites resistant to antimalarial drugs and the increasing insecticide resistance of mosquitoes-may cause the number of malaria cases to double over the next two decades. To stimulate basic research and facilitate the development of new drugs and vaccines, the genome of Plasmodium falciparum clone 3D7 has been sequenced using a chromosome-by-chromosome shotgun strategy. We report here the nucleotide sequences of chromosomes 10, 11 and 14, and a re-analysis of the chromosome 2 sequence. These chromosomes represent about 35\% of the 23-megabase P. falciparum genome.}, keywords = {Animals, Chromosomes, DNA, Protozoan, Genome, Protozoan, Plasmodium falciparum, Proteome, Protozoan Proteins, Sequence Analysis, DNA}, author = {Gardner, Malcolm J. and Shallom, Shamira J. and Carlton, Jane M. and Salzberg, Steven L. and Nene, Vishvanath and Shoaibi, Azadeh and Ciecko, Anne and Lynn, Jeffery and Rizzo, Michael and Weaver, Bruce and Jarrahi, Behnam and Brenner, Michael and Parvizi, Babak and Tallon, Luke and Moazzez, Azita and Granger, David and Fujii, Claire and Hansen, Cheryl and Pederson, James and Feldblyum, Tamara and Peterson, Jeremy and Suh, Bernard and Angiuoli, Sam and Pertea, Mihaela and Allen, Jonathan and J. Selengut and White, Owen and Cummings, Leda M. and Smith, Hamilton O. and Adams, Mark D. and Venter, J. Craig and Carucci, Daniel J. and Hoffman, Stephen L. and Fraser, Claire M.} } @article {49632, title = {Trypanosoma cruzi: RNA structure and post-transcriptional control of tubulin gene expression.}, journal = {Exp Parasitol}, volume = {102}, year = {2002}, month = {2002 Nov-Dec}, pages = {123-33}, abstract = {

Changes in tubulin expression are among the biochemical and morphological adaptations that occur during the life cycle of Trypanosomatids. To investigate the mechanism responsible for the differential accumulation of tubulin mRNAs in Trypanosoma cruzi, we determine the sequences of alpha- and beta-tubulin transcripts and analyzed their expression during the life cycle of the parasite. Two beta-tubulin mRNAs of 1.9 and 2.3 kb were found to differ mainly by an additional 369 nucleotides at the end of the 3{\textquoteright} untranslated region (UTR). Although their transcription rates are similar in epimastigotes and amastigotes, alpha- and beta-tubulin transcripts are 3- to 6-fold more abundant in epimastigotes than in trypomastigotes and amastigotes. Accordingly, the half-lives of alpha- and beta-tubulin mRNAs are significantly higher in epimastigotes than in amastigotes. Transient transfection experiments indicated that positive regulatory elements occur in the 3{\textquoteright} UTR plus downstream intergenic region of the alpha-tubulin gene and that both positive and negative elements occur in the equivalent regions of the beta-tubulin gene.

}, keywords = {Animals, Base Sequence, Blotting, Northern, DNA, Complementary, DNA, Protozoan, Gene Expression Regulation, Half-Life, Life Cycle Stages, Molecular Sequence Data, RNA Processing, Post-Transcriptional, RNA, Messenger, RNA, Protozoan, Transcription, Genetic, Transfection, Trypanosoma cruzi, Tubulin}, issn = {0014-4894}, author = {Bartholomeu, Daniella C and Silva, Rosiane A and Galv{\~a}o, Lucia M C and el-Sayed, Najib M A and Donelson, John E and Teixeira, Santuza M R} }