% Bibliography entries on protozoan parasite genomics (Leishmania, Trypanosoma, Plasmodium).
% Citation keys are numeric and are left unchanged so that existing \cite commands keep resolving.

@article{49535,
  author   = {Smircich, Pablo and Forteza, Diego and El-Sayed, Najib M and Garat, Beatriz},
  title    = {Genomic analysis of sequence-dependent {DNA} curvature in {Leishmania}},
  journal  = {PLoS One},
  volume   = {8},
  year     = {2013},
  pages    = {e63068},
  issn     = {1932-6203},
  doi      = {10.1371/journal.pone.0063068},
  keywords = {Chromosome mapping, Comparative Genomic Hybridization, Computational Biology, DNA, Protozoan, Genome, Protozoan, Genomics, HUMANS, Leishmania, Nucleic Acid Conformation},
  abstract = {Leishmania major is a flagellated protozoan parasite of medical importance. Like other members of the Trypanosomatidae family, it possesses unique mechanisms of gene expression such as constitutive polycistronic transcription of directional gene clusters, gene amplification, mRNA trans-splicing, and extensive editing of mitochondrial transcripts. The molecular signals underlying most of these processes remain under investigation. In order to investigate the role of DNA secondary structure signals in gene expression, we carried out a genome-wide in silico analysis of the intrinsic DNA curvature. The L. major genome revealed a lower frequency of high intrinsic curvature regions as well as inter- and intra- chromosomal distribution heterogeneity, when compared to prokaryotic and eukaryotic organisms. Using a novel method aimed at detecting region-integrated intrinsic curvature (RIIC), high DNA curvature was found to be associated with regions implicated in transcription initiation. Those include divergent strand-switch regions between directional gene clusters and regions linked to markers of active transcription initiation such as acetylated H3 histone, TRF4 and SNAP50. These findings suggest a role for DNA curvature in transcription initiation in Leishmania supporting the relevance of DNA secondary structures signals.},
}

@article{49653,
  author   = {Choi, J and El-Sayed, N M},
  title    = {Functional genomics of trypanosomatids},
  journal  = {Parasite Immunol},
  volume   = {34},
  year     = {2012},
  month    = feb # "--" # mar,
  pages    = {72--79},
  issn     = {1365-3024},
  doi      = {10.1111/j.1365-3024.2011.01347.x},
  keywords = {Animals, Genome, Protozoan, Genomics, HUMANS, Proteome, Protozoan Proteins, Transcriptome, Trypanosomatina},
  abstract = {The decoding of the Tritryp reference genomes nearly 7 years ago provided a first peek into the biology of pathogenic trypanosomatids and a blueprint that has paved the way for genome-wide studies. Although 60-70\% of the predicted protein coding genes in Trypanosoma brucei, Trypanosoma cruzi and Leishmania major remain unannotated, the functional genomics landscape is rapidly changing. Facilitated by the advent of next-generation sequencing technologies, improved structural and functional annotation and genes and their products are emerging. Information is also growing for the interactions between cellular components as transcriptomes, regulatory networks and metabolomes are characterized, ushering in a new era of systems biology. Simultaneously, the launch of comparative sequencing of multiple strains of kinetoplastids will finally lead to the investigation of a vast, yet to be explored, evolutionary and pathogenomic space.},
}

@article{49652,
  author   = {Teixeira, Santuza M and El-Sayed, Najib M and Ara{\'u}jo, Patr{\'\i}cia R},
  title    = {The genome and its implications},
  journal  = {Adv Parasitol},
  volume   = {75},
  year     = {2011},
  pages    = {209--230},
  issn     = {0065-308X},
  doi      = {10.1016/B978-0-12-385863-4.00010-1},
  keywords = {Animals, Antigens, Protozoan, Chagas Disease, Chromosomes, Comparative Genomic Hybridization, DNA, Protozoan, Gene Expression Regulation, Genetic Variation, Genome, Protozoan, Host-Parasite Interactions, HUMANS, Species Specificity, Synteny, Transcription, Genetic, Transfection, Trypanosoma cruzi},
  abstract = {Trypanosoma cruzi has a heterogeneous population composed of a pool of strains that circulate in the domestic and sylvatic cycles. Genome sequencing of the clone CL Brener revealed a highly repetitive genome of about 110Mb containing an estimated 22,570 genes. Because of its hybrid nature, sequences representing the two haplotypes have been generated. In addition, a repeat content close to 50\% made the assembly of the estimated 41 pairs of chromosomes quite challenging. Similar to other trypanosomatids, the organization of T. cruzi chromosomes was found to be very peculiar, with protein-coding genes organized in long polycistronic transcription units encoding 20 or more proteins in one strand separated by strand switch regions. Another remarkable feature of the T. cruzi genome is the massive expansion of surface protein gene families. Because of the high genetic diversity of the T. cruzi population, sequencing of additional strains and comparative genomic and transcriptome analyses are in progress. Five years after its publication, the genome data have proven to be an essential tool for the study of T. cruzi and increasing efforts to translate this knowledge into the development of new modes of intervention to control Chagas disease are underway.},
}

@article{49644,
  author   = {Bartholomeu, Daniella C and Cerqueira, Gustavo C and Le{\~a}o, Ana Carolina A and daRocha, Wanderson D and Pais, Fabiano S and Macedo, Camila and Djikeng, Appolinaire and Teixeira, Santuza M R and El-Sayed, Najib M},
  title    = {Genomic organization and expression profile of the mucin-associated surface protein (masp) family of the human pathogen {Trypanosoma} cruzi},
  journal  = {Nucleic Acids Res},
  volume   = {37},
  year     = {2009},
  month    = jun,
  pages    = {3407--3417},
  issn     = {1362-4962},
  doi      = {10.1093/nar/gkp172},
  keywords = {3{\textquoteright} Flanking Region, 5{\textquoteright} Flanking Region, Amino Acid Sequence, Animals, Base Sequence, Conserved Sequence, Gene Expression Profiling, Genes, Protozoan, Genome, Protozoan, Membrane Proteins, Molecular Sequence Data, Mucins, Multigene Family, Protozoan Proteins, RNA, Messenger, Trypanosoma cruzi},
  abstract = {A novel large multigene family was recently identified in the human pathogen Trypanosoma cruzi, causative agent of Chagas disease, and corresponds to approximately 6\% of the parasite diploid genome. The predicted gene products, mucin-associated surface proteins (MASPs), are characterized by highly conserved N- and C-terminal domains and a strikingly variable and repetitive central region. We report here an analysis of the genomic organization and expression profile of masp genes. Masps are not randomly distributed throughout the genome but instead are clustered with genes encoding mucin and other surface protein families. Masp transcripts vary in size, are preferentially expressed during the trypomastigote stage and contain highly conserved 5{\textquoteright} and 3{\textquoteright} untranslated regions. A sequence analysis of a trypomastigote cDNA library reveals the expression of multiple masp variants with a bias towards a particular masp subgroup. Immunofluorescence assays using antibodies generated against a MASP peptide reveals that the expression of particular MASPs at the cell membrane is limited to subsets of the parasite population. Western blots of phosphatidylinositol-specific phospholipase C (PI-PLC)-treated parasites suggest that MASP may be GPI-anchored and shed into the medium culture, thus contributing to the large repertoire of parasite polypeptides that are exposed to the host immune system.},
}

@article{49642,
  author   = {Bringaud, Frederic and M{\"u}ller, Michaela and Cerqueira, Gustavo Coutinho and Smith, Martin and Rochette, Annie and El-Sayed, Najib M A and Papadopoulou, Barbara and Ghedin, Elodie},
  title    = {Members of a large retroposon family are determinants of post-transcriptional gene expression in {Leishmania}},
  journal  = {PLoS Pathog},
  volume   = {3},
  year     = {2007},
  month    = sep,
  pages    = {1291--1307},
  issn     = {1553-7374},
  doi      = {10.1371/journal.ppat.0030136},
  keywords = {3{\textquoteright} Untranslated Regions, Animals, Base Sequence, Biological Evolution, Down-Regulation, Gene Expression Regulation, Genome, Protozoan, Leishmania, Leishmania major, Molecular Sequence Data, Retroelements, RNA, Messenger, sequence alignment, Trypanosoma brucei brucei, Trypanosoma cruzi},
  abstract = {Trypanosomatids are unicellular protists that include the human pathogens Leishmania spp. (leishmaniasis), Trypanosoma brucei (sleeping sickness), and Trypanosoma cruzi (Chagas disease). Analysis of their recently completed genomes confirmed the presence of non-long-terminal repeat retrotransposons, also called retroposons. Using the 79-bp signature sequence common to all trypanosomatid retroposons as bait, we identified in the Leishmania major genome two new large families of small elements---LmSIDER1 (785 copies) and LmSIDER2 (1,073 copies)---that fulfill all the characteristics of extinct trypanosomatid retroposons. LmSIDERs are approximately 70 times more abundant in L. major compared to T. brucei and are found almost exclusively within the 3{\textquoteright}-untranslated regions (3{\textquoteright}UTRs) of L. major mRNAs. We provide experimental evidence that LmSIDER2 act as mRNA instability elements and that LmSIDER2-containing mRNAs are generally expressed at lower levels compared to the non-LmSIDER2 mRNAs. The considerable expansion of LmSIDERs within 3{\textquoteright}UTRs in an organism lacking transcriptional control and their role in regulating mRNA stability indicate that Leishmania have probably recycled these short retroposons to globally modulate the expression of a number of genes. To our knowledge, this is the first example in eukaryotes of the domestication and expansion of a family of mobile elements that have evolved to fulfill a critical cellular function.},
}

@article{49635,
  author   = {Ghedin, Elodie and Bringaud, Frederic and Peterson, Jeremy and Myler, Peter and Berriman, Matthew and Ivens, Alasdair and Andersson, Bj{\"o}rn and Bontempi, Esteban and Eisen, Jonathan and Angiuoli, Sam and Wanless, David and Von Arx, Anna and Murphy, Lee and Lennard, Nicola and Salzberg, Steven and Adams, Mark D and White, Owen and Hall, Neil and Stuart, Kenneth and Fraser, Claire M and El-Sayed, Najib M A},
  title    = {Gene synteny and evolution of genome architecture in trypanosomatids},
  journal  = {Mol Biochem Parasitol},
  volume   = {134},
  year     = {2004},
  month    = apr,
  pages    = {183--191},
  issn     = {0166-6851},
  doi      = {10.1016/j.molbiopara.2003.11.012},
  keywords = {Animals, Computational Biology, Evolution, Molecular, Gene Order, Genome, Protozoan, Genomics, Leishmania major, Multigene Family, Recombination, Genetic, Retroelements, Selection, Genetic, Synteny, Trypanosoma brucei brucei, Trypanosoma cruzi, Trypanosomatina},
  abstract = {The trypanosomatid protozoa Trypanosoma brucei, Trypanosoma cruzi and Leishmania major are related human pathogens that cause markedly distinct diseases. Using information from genome sequencing projects currently underway, we have compared the sequences of large chromosomal fragments from each species. Despite high levels of divergence at the sequence level, these three species exhibit a striking conservation of gene order, suggesting that selection has maintained gene order among the trypanosomatids over hundreds of millions of years of evolution. The few sites of genome rearrangement between these species are marked by the presence of retrotransposon-like elements, suggesting that retrotransposons may have played an important role in shaping trypanosomatid genome organization. A degenerate retroelement was identified in L. major by examining the regions near breakage points of the synteny. This is the first such element found in L. major suggesting that retroelements were found in the common ancestor of all three species.},
}

@article{49634,
  author   = {Bringaud, Frederic and Biteau, Nicolas and Zuiderwijk, Eduard and Berriman, Matthew and El-Sayed, Najib M and Ghedin, Elodie and Melville, Sara E and Hall, Neil and Baltz, Th{\'e}o},
  title    = {The ingi and {RIME} {non-LTR} retrotransposons are not randomly distributed in the genome of {Trypanosoma} brucei},
  journal  = {Mol Biol Evol},
  volume   = {21},
  year     = {2004},
  month    = mar,
  pages    = {520--528},
  issn     = {0737-4038},
  doi      = {10.1093/molbev/msh045},
  keywords = {Amino Acid Sequence, Animals, Base Sequence, Consensus Sequence, Genome, Protozoan, Molecular Sequence Data, Retroelements, Sequence Analysis, Trypanosoma brucei brucei},
  abstract = {The ingi (long and autonomous) and RIME (short and nonautonomous) non--long-terminal repeat retrotransposons are the most abundant mobile elements characterized to date in the genome of the African trypanosome Trypanosoma brucei. These retrotransposons were thought to be randomly distributed, but a detailed and comprehensive analysis of their genomic distribution had not been performed until now. To address this question, we analyzed the ingi/RIME sequences and flanking sequences from the ongoing T. brucei genome sequencing project (TREU927/4 strain). Among the 81 ingi/RIME elements analyzed, 60\% are complete, and 7\% of the ingi elements (approximately 15 copies per haploid genome) appear to encode for their own transposition. The size of the direct repeat flanking the ingi/RIME retrotransposons is conserved (i.e., 12-bp), and a strong 11-bp consensus pattern precedes the 5{\textquoteright}-direct repeat. The presence of a consensus pattern upstream of the retroelements was confirmed by the analysis of the base occurrence in 294 GSS containing 5{\textquoteright}-adjacent ingi/RIME sequences. The conserved sequence is present upstream of ingis and RIMEs, suggesting that ingi-encoded enzymatic activities are used for retrotransposition of RIMEs, which are short nonautonomous retroelements. In conclusion, the ingi and RIME retroelements are not randomly distributed in the genome of T. brucei and are preceded by a conserved sequence, which may be the recognition site of the ingi-encoded endonuclease.},
}

@article{49664,
  author   = {Bartholomeu, Daniella and El-Sayed, Najib M},
  title    = {Sequencing strategies for parasite genomes},
  journal  = {Methods Mol Biol},
  volume   = {270},
  year     = {2004},
  pages    = {1--16},
  issn     = {1064-3745},
  doi      = {10.1385/1-59259-793-9:001},
  keywords = {Animals, Chromosome Walking, Chromosomes, Artificial, Bacterial, Genetic Markers, Genome, Protozoan, Plasmodium falciparum},
  abstract = {Recent advances in the field of sequencing have enabled the determination of the complete nucleotide sequence of a large number of complex genomes. The complete genome sequence of the parasite Plasmodium falciparum has been published recently, and many other parasite genome initiatives are underway. Parasite genomes vary in size, nucleotide composition, polymorphism level, content, and distribution of repetitive elements. These genomic features affect the performance of sequencing strategies. As a consequence, each of the ongoing parasite genome projects has adopted distinct sequencing approaches. The degree of completeness and accuracy desired as well as available funds should be considered carefully when choosing the most appropriate sequencing strategy.},
}

@article{38304,
  author   = {Gardner, Malcolm J. and Hall, Neil and Fung, Eula and White, Owen and Berriman, Matthew and Hyman, Richard W. and Carlton, Jane M. and Pain, Arnab and Nelson, Karen E. and Bowman, Sharen and Paulsen, Ian T. and James, Keith and Eisen, Jonathan A. and Rutherford, Kim and Salzberg, Steven L. and Craig, Alister and Kyes, Sue and Chan, Man-Suen and Nene, Vishvanath and Shallom, Shamira J. and Suh, Bernard and Peterson, Jeremy and Angiuoli, Sam and Pertea, Mihaela and Allen, Jonathan and Selengut, J. and Haft, Daniel and Mather, Michael W. and Vaidya, Akhil B. and Martin, David M. A. and Fairlamb, Alan H. and Fraunholz, Martin J. and Roos, David S. and Ralph, Stuart A. and McFadden, Geoffrey I. and Cummings, Leda M. and Subramanian, G. Mani and Mungall, Chris and Venter, J. Craig and Carucci, Daniel J. and Hoffman, Stephen L. and Newbold, Chris and Davis, Ronald W. and Fraser, Claire M. and Barrell, Bart},
  title    = {Genome sequence of the human malaria parasite {Plasmodium} falciparum},
  journal  = {Nature},
  volume   = {419},
  year     = {2002},
  doi      = {10.1038/nature01097},
  url      = {http://www.ncbi.nlm.nih.gov/pubmed/12368864?dopt=Abstract},
  keywords = {Animals, Chromosome Structures, DNA Repair, DNA Replication, DNA, Protozoan, Evolution, Molecular, Genome, Protozoan, HUMANS, Malaria Vaccines, Malaria, Falciparum, Membrane Transport Proteins, Molecular Sequence Data, Plasmodium falciparum, Plastids, Proteome, Protozoan Proteins, Recombination, Genetic, Sequence Analysis, DNA},
  abstract = {The parasite Plasmodium falciparum is responsible for hundreds of millions of cases of malaria, and kills more than one million African children annually. Here we report an analysis of the genome sequence of P. falciparum clone 3D7. The 23-megabase nuclear genome consists of 14 chromosomes, encodes about 5,300 genes, and is the most (A + T)-rich genome sequenced to date. Genes involved in antigenic variation are concentrated in the subtelomeric regions of the chromosomes. Compared to the genomes of free-living eukaryotic microbes, the genome of this intracellular parasite encodes fewer enzymes and transporters, but a large proportion of genes are devoted to immune evasion and host-parasite interactions. Many nuclear-encoded proteins are targeted to the apicoplast, an organelle involved in fatty-acid and isoprenoid metabolism. The genome sequence provides the foundation for future studies of this organism, and is being exploited in the search for new drugs and vaccines to fight malaria.},
}

@article{49630,
  author   = {Bringaud, Frederic and Garc{\'\i}a-P{\'e}rez, Jos{\'e} Luis and Heras, Sara R and Ghedin, Elodie and El-Sayed, Najib M and Andersson, Bj{\"o}rn and Baltz, Th{\'e}o and Lopez, Manuel C},
  title    = {Identification of non-autonomous {non-LTR} retrotransposons in the genome of {Trypanosoma} cruzi},
  journal  = {Mol Biochem Parasitol},
  volume   = {124},
  year     = {2002},
  month    = sep # "--" # oct,
  pages    = {73--78},
  issn     = {0166-6851},
  keywords = {Animals, Base Sequence, Computational Biology, Genome, Protozoan, Long Interspersed Nucleotide Elements, Molecular Sequence Data, Retroelements, Short Interspersed Nucleotide Elements, Trypanosoma cruzi},
  abstract = {As observed for most eukaryotic cells, trypanosomatids contain non-LTR retrotransposons randomly inserted in the nuclear genome. Autonomous retroelements, which code for their own transposition, have been characterized in Trypanosoma brucei (ingi) and Trypanosoma cruzi (L1Tc), whereas non-autonomous retroelements have only been characterized in T. brucei (RIME). Here, we have characterized in the genome of Trypanosoma cruzi four complete copies of a non-autonomous non-LTR retrotransposon, called NARTc. This 0.26 kb NARTc element has the characteristics of non-LTR retrotransposons: the presence of a poly(dA) tail and of a short flanking duplicated motif. Analysis of the Genome Survey Sequence databases indicated that the Trypanosoma cruzi haploid genome contains about 140 NARTc copies and about twice as many L1Tc copies. Interestingly, the NARTc and L1Tc retroelements share, with the Trypanosoma brucei ingi and RIME retrotransposons, a common sequence (the first 45 bp with 91\% identity), whereas the remaining sequences are very divergent. This suggests that these four trypanosome non-LTR retrotransposons were derived from the same common ancestor and the sequence of their 5{\textquoteright}-extremity may have a functional role. In addition, the genome of Leishmania major contains the same conserved motif present in the trypanosome retroelements, while no transposable elements have been detected so far in Leishmania sp.},
}

@article{38492,
  author   = {Gardner, Malcolm J. and Shallom, Shamira J. and Carlton, Jane M. and Salzberg, Steven L. and Nene, Vishvanath and Shoaibi, Azadeh and Ciecko, Anne and Lynn, Jeffery and Rizzo, Michael and Weaver, Bruce and Jarrahi, Behnam and Brenner, Michael and Parvizi, Babak and Tallon, Luke and Moazzez, Azita and Granger, David and Fujii, Claire and Hansen, Cheryl and Pederson, James and Feldblyum, Tamara and Peterson, Jeremy and Suh, Bernard and Angiuoli, Sam and Pertea, Mihaela and Allen, Jonathan and Selengut, J. and White, Owen and Cummings, Leda M. and Smith, Hamilton O. and Adams, Mark D. and Venter, J. Craig and Carucci, Daniel J. and Hoffman, Stephen L. and Fraser, Claire M.},
  title    = {Sequence of {Plasmodium} falciparum chromosomes 2, 10, 11 and 14},
  journal  = {Nature},
  volume   = {419},
  year     = {2002},
  doi      = {10.1038/nature01094},
  url      = {http://www.ncbi.nlm.nih.gov/pubmed/12368868?dopt=Abstract},
  keywords = {Animals, Chromosomes, DNA, Protozoan, Genome, Protozoan, Plasmodium falciparum, Proteome, Protozoan Proteins, Sequence Analysis, DNA},
  abstract = {The mosquito-borne malaria parasite Plasmodium falciparum kills an estimated 0.7-2.7 million people every year, primarily children in sub-Saharan Africa. Without effective interventions, a variety of factors---including the spread of parasites resistant to antimalarial drugs and the increasing insecticide resistance of mosquitoes---may cause the number of malaria cases to double over the next two decades. To stimulate basic research and facilitate the development of new drugs and vaccines, the genome of Plasmodium falciparum clone 3D7 has been sequenced using a chromosome-by-chromosome shotgun strategy. We report here the nucleotide sequences of chromosomes 10, 11 and 14, and a re-analysis of the chromosome 2 sequence. These chromosomes represent about 35\% of the 23-megabase P. falciparum genome.},
}