@booklet {49615, title = {Algorithms in Bioinformatics: 15th International Workshop, WABI 2015}, howpublished = {Lecture Notes in Bioinformatics}, number = {9289}, year = {2015}, month = {September 2015}, pages = {328}, publisher = {Springer}, isbn = {978-3-662-48220-9}, author = {Pop, Mihai and Touzet, H{\'e}l{\`e}ne}, editor = {Istrail, Sorin and Pevzner, Pavel and Waterman, Michael S} } @article {45867, title = {Automated ensemble assembly and validation of microbial genomes.}, journal = {BMC Bioinformatics}, volume = {15}, year = {2014}, month = {2014}, pages = {126}, abstract = {

BACKGROUND: The continued democratization of DNA sequencing has sparked a new wave of development of genome assembly and assembly validation methods. As individual research labs, rather than centralized centers, begin to sequence the majority of new genomes, it is important to establish best practices for genome assembly. However, recent evaluations such as GAGE and the Assemblathon have concluded that there is no single best approach to genome assembly. Instead, it is preferable to generate multiple assemblies and validate them to determine which is most useful for the desired analysis; this is a labor-intensive process that is often impossible or unfeasible.

RESULTS: To encourage best practices supported by the community, we present iMetAMOS, an automated ensemble assembly pipeline; iMetAMOS encapsulates the process of running, validating, and selecting a single assembly from multiple assemblies. iMetAMOS packages several leading open-source tools into a single binary that automates parameter selection and execution of multiple assemblers, scores the resulting assemblies based on multiple validation metrics, and annotates the assemblies for genes and contaminants. We demonstrate the utility of the ensemble process on 225 previously unassembled Mycobacterium tuberculosis genomes as well as a Rhodobacter sphaeroides benchmark dataset. On these real data, iMetAMOS reliably produces validated assemblies and identifies potential contamination without user intervention. In addition, intelligent parameter selection produces assemblies of R. sphaeroides comparable to or exceeding the quality of those from the GAGE-B evaluation, affecting the relative ranking of some assemblers.

CONCLUSIONS: Ensemble assembly with iMetAMOS provides users with multiple, validated assemblies for each genome. Although computationally limited to small or mid-sized genomes, this approach is the most effective and reproducible means for generating high-quality assemblies and enables users to select an assembly best tailored to their specific needs.

}, keywords = {Genome, Bacterial, Genome, Microbial, Genomics, Mycobacterium tuberculosis, Rhodobacter sphaeroides, Sequence Analysis, DNA, software}, issn = {1471-2105}, doi = {10.1186/1471-2105-15-126}, author = {Koren, Sergey and Todd Treangen and Hill, Christopher M and Pop, Mihai and Phillippy, Adam M} } @inbook {38124, title = {AWTY, BAMBE, BEAGLE, BEAST, BEAUti, Bio++, DataMonkey, DendroPy, DnaSP, ENCprime/SeqCount, FigTree, GARLI, genealogical sorting index (gsi), HyPhy, IMa2, jModelTest, JELLYFISH, LAMARC, MacClade, MEGA, Mesquite}, booktitle = {Dictionary of Bioinformatics}, year = {2013}, publisher = {Wiley-Liss}, organization = {Wiley-Liss}, address = {Hoboken}, author = {Michael P. Cummings}, editor = {Hancock, J. and Zvelebil, M.} } @article {38107, title = {AGORA: Assembly Guided by Optical Restriction Alignment}, journal = {BMC bioinformaticsBMC Bioinformatics}, volume = {13}, year = {2012}, publisher = {BioMed Central Ltd}, author = {Lin, H. C. and Goldstein, S. and L. Mendelowitz and Zhou, S. and Wetzel, J. and Schwartz, D. C. and M. Pop} } @article {38119, title = {Archaeosortases and exosortases are widely distributed systems linking membrane transit with posttranslational modification}, journal = {Journal of bacteriologyJournal of bacteriology}, volume = {194}, year = {2012}, note = {http://www.ncbi.nlm.nih.gov/pubmed/22037399?dopt=Abstract}, type = {10.1128/JB.06026-11}, abstract = {Multiple new prokaryotic C-terminal protein-sorting signals were found that reprise the tripartite architecture shared by LPXTG and PEP-CTERM: motif, TM helix, basic cluster. Defining hidden Markov models were constructed for all. PGF-CTERM occurs in 29 archaeal species, some of which have more than 50 proteins that share the domain. PGF-CTERM proteins include the major cell surface protein in Halobacterium, a glycoprotein with a partially characterized diphytanylglyceryl phosphate linkage near its C terminus. Comparative genomics identifies a distant exosortase homolog, designated archaeosortase A (ArtA), as the likely protein-processing enzyme for PGF-CTERM. Proteomics suggests that the PGF-CTERM region is removed. Additional systems include VPXXXP-CTERM/archeaosortase B in two of the same archaea and PEF-CTERM/archaeosortase C in four others. Bacterial exosortases often fall into subfamilies that partner with very different cohorts of extracellular polymeric substance biosynthesis proteins; several species have multiple systems. Variant systems include the VPDSG-CTERM/exosortase C system unique to certain members of the phylum Verrucomicrobia, VPLPA-CTERM/exosortase D in several alpha- and deltaproteobacterial species, and a dedicated (single-target) VPEID-CTERM/exosortase E system in alphaproteobacteria. Exosortase-related families XrtF in the class Flavobacteria and XrtG in Gram-positive bacteria mark distinctive conserved gene neighborhoods. A picture emerges of an ancient and now well-differentiated superfamily of deeply membrane-embedded protein-processing enzymes. Their target proteins are destined to transit cellular membranes during their biosynthesis, during which most undergo additional posttranslational modifications such as glycosylation.}, keywords = {Amino Acid Sequence, Aminoacyltransferases, Archaeal Proteins, Bacterial Proteins, Cell Membrane, Cysteine Endopeptidases, Gene Expression Regulation, Archaeal, Gene Expression Regulation, Bacterial, Gene Expression Regulation, Enzymologic, Molecular Sequence Data, Protein Processing, Post-Translational}, author = {Haft, Daniel H. and Payne, Samuel H. and J. Selengut} } @article {49775, title = {Archaeosortases and exosortases are widely distributed systems linking membrane transit with posttranslational modification.}, journal = {J Bacteriol}, volume = {194}, year = {2012}, month = {2012 Jan}, pages = {36-48}, abstract = {

Multiple new prokaryotic C-terminal protein-sorting signals were found that reprise the tripartite architecture shared by LPXTG and PEP-CTERM: motif, TM helix, basic cluster. Defining hidden Markov models were constructed for all. PGF-CTERM occurs in 29 archaeal species, some of which have more than 50 proteins that share the domain. PGF-CTERM proteins include the major cell surface protein in Halobacterium, a glycoprotein with a partially characterized diphytanylglyceryl phosphate linkage near its C terminus. Comparative genomics identifies a distant exosortase homolog, designated archaeosortase A (ArtA), as the likely protein-processing enzyme for PGF-CTERM. Proteomics suggests that the PGF-CTERM region is removed. Additional systems include VPXXXP-CTERM/archeaosortase B in two of the same archaea and PEF-CTERM/archaeosortase C in four others. Bacterial exosortases often fall into subfamilies that partner with very different cohorts of extracellular polymeric substance biosynthesis proteins; several species have multiple systems. Variant systems include the VPDSG-CTERM/exosortase C system unique to certain members of the phylum Verrucomicrobia, VPLPA-CTERM/exosortase D in several alpha- and deltaproteobacterial species, and a dedicated (single-target) VPEID-CTERM/exosortase E system in alphaproteobacteria. Exosortase-related families XrtF in the class Flavobacteria and XrtG in Gram-positive bacteria mark distinctive conserved gene neighborhoods. A picture emerges of an ancient and now well-differentiated superfamily of deeply membrane-embedded protein-processing enzymes. Their target proteins are destined to transit cellular membranes during their biosynthesis, during which most undergo additional posttranslational modifications such as glycosylation.

}, keywords = {Amino Acid Sequence, Aminoacyltransferases, Archaeal Proteins, Bacterial Proteins, Cell Membrane, Cysteine Endopeptidases, Gene Expression Regulation, Archaeal, Gene Expression Regulation, Bacterial, Gene Expression Regulation, Enzymologic, Molecular Sequence Data, Protein Processing, Post-Translational}, issn = {1098-5530}, doi = {10.1128/JB.06026-11}, author = {Haft, Daniel H and Payne, Samuel H and Selengut, Jeremy D} } @article {38101, title = {Accelerated evolution of 3{\textquoteright}avian FOXE1 genes, and thyroid and feather specific expression of chicken FoxE1}, journal = {BMC Evolutionary BiologyBMC Evolutionary Biology}, volume = {11}, year = {2011}, type = {10.1186/1471-2148-11-302}, abstract = {The forkhead transcription factor gene E1 (FOXE1) plays an important role in regulation of thyroid development, palate formation and hair morphogenesis in mammals. However, avian FOXE1 genes have not been characterized and as such, codon evolution of FOXE1 orthologs in a broader evolutionary context of mammals and birds is not known.}, isbn = {1471-2148}, author = {Yaklichkin, Sergey Yu and Darnell, Diana K. and Pier, Maricela V. and Antin, Parker B. and Sridhar Hannenhalli} } @article {38102, title = {Accurate and fast estimation of taxonomic profiles from metagenomic shotgun sequences}, journal = {BMC GenomicsBMC Genomics}, volume = {12}, year = {2011}, type = {10.1186/1471-2164-12-S2-S4}, abstract = {A major goal of metagenomics is to characterize the microbial composition of an environment. The most popular approach relies on 16S rRNA sequencing, however this approach can generate biased estimates due to differences in the copy number of the gene between even closely related organisms, and due to PCR artifacts. The taxonomic composition can also be determined from metagenomic shotgun sequencing data by matching individual reads against a database of reference sequences. One major limitation of prior computational methods used for this purpose is the use of a universal classification threshold for all genes at all taxonomic levels.}, isbn = {1471-2164}, author = {Liu, Bo and Gibbons, Theodore and Ghodsi, Mohammad and Todd Treangen and M. Pop} } @article {49744, title = {Accurate proteome-wide protein quantification from high-resolution 15N mass spectra.}, journal = {Genome Biol}, volume = {12}, year = {2011}, month = {2011}, pages = {R122}, abstract = {

In quantitative mass spectrometry-based proteomics, the metabolic incorporation of a single source of 15N-labeled nitrogen has many advantages over using stable isotope-labeled amino acids. However, the lack of a robust computational framework for analyzing the resulting spectra has impeded wide use of this approach. We have addressed this challenge by introducing a new computational methodology for analyzing 15N spectra in which quantification is integrated with identification. Application of this method to an Escherichia coli growth transition reveals significant improvement in quantification accuracy over previous methods.

}, keywords = {algorithms, Amino Acid Sequence, Bacterial Proteins, Escherichia coli, Isotope Labeling, Mass Spectrometry, Molecular Sequence Data, Nitrogen Isotopes, Proteome, proteomics, Sensitivity and Specificity, software}, issn = {1474-760X}, doi = {10.1186/gb-2011-12-12-r122}, author = {Khan, Zia and Amini, Sasan and Bloom, Joshua S and Ruse, Cristian and Caudy, Amy A and Kruglyak, Leonid and Singh, Mona and Perlman, David H and Tavazoie, Saeed} } @article {49554, title = {Accurate proteome-wide protein quantification from high-resolution 15N mass spectra}, volume = {12}, year = {2011}, month = {Jan-01-2011}, pages = {R122}, issn = {1465-6906}, doi = {10.1186/gb-2011-12-12-r122}, url = {http://genomebiology.com/2012/12/12/R122}, author = {Khan, Zia and Amini, Sasan and Bloom, Joshua S and Ruse, Cristian and Caudy, Amy A and Kruglyak, Leonid and Singh, Mona and Perlman, David H and Tavazoie, Saeed} } @article {38118, title = {Aquatic Realm and Cholera}, journal = {Epidemiological and Molecular Aspects on CholeraEpidemiological and Molecular Aspects on Cholera}, year = {2011}, type = {10.1007/978-1-60327-265-0_18}, abstract = {Cholera is an ancient disease that can be severe and life threatening. It occurs predominantly in areas of the world where populations lack safe drinking water. Epidemics of cholera are linked with malnutrition, poor sanitation, and conditions resulting from natural disasters such as severe flooding. According to a report published by WHO in 2000 [1], cholera remains a major public health problem and is becoming increasingly important since the number of countries in which cholera is endemic continues to increase. Unfortunately, outbreaks of the disease continue into the twenty-first century with ominous portent in the wake of global climate change [1]. Yet cholera is a preventable disease if people have access to safe drinking water and are properly educated how to protect themselves from the risk of infection with vibrios. Cholera also is an easily treatable disease. Oral rehydration therapy, a solution containing glucose and appropriate salts, has proven to be effective for treatment of most cholera victims [2]. Nevertheless, each year, tens of thousands of people are victims of the disease, bringing this {\textquotedblleft}curse of humankind{\textquotedblright} to modern civilization. Present understanding of cholera is based on studies conducted over the past three decades and significant new information has been gained concerning environmental factors associated with this disease, especially how to detect the bacterium and where it lives in the natural environment, outside the human gut, and what triggers the annual outbreaks that occur with remarkable regularity. Environmental research on Vibrio cholerae and cholera has provided insights for prediction and prevention of the disease it causes, while the race for effective vaccines against cholera continues.}, author = {Huq, A. and Grim, C. J. and Rita R. Colwell} } @article {38122, title = {Assessing the benefits of using mate-pairs to resolve repeats in de novo short-read prokaryotic assemblies}, journal = {BMC bioinformaticsBMC Bioinformatics}, volume = {12}, year = {2011}, publisher = {BioMed Central Ltd}, author = {Wetzel, J. and Kingsford, Carl and M. Pop} } @article {38109, title = {Alignment and clustering of phylogenetic markers - implications for microbial diversity studies}, journal = {BMC BioinformaticsBMC Bioinformatics}, volume = {11}, year = {2010}, type = {10.1186/1471-2105-11-152}, abstract = {Molecular studies of microbial diversity have provided many insights into the bacterial communities inhabiting the human body and the environment. A common first step in such studies is a survey of conserved marker genes (primarily 16S rRNA) to characterize the taxonomic composition and diversity of these communities. To date, however, there exists significant variability in analysis methods employed in these studies.}, isbn = {1471-2105}, author = {White, James R. and Navlakha, Saket and Nagarajan, Niranjan and Ghodsi, Mohammad-Reza and Kingsford, Carl and M. Pop} } @article {49648, title = {The Alveolate Perkinsus marinus: biological insights from EST gene discovery.}, journal = {BMC Genomics}, volume = {11}, year = {2010}, month = {2010}, pages = {228}, abstract = {

BACKGROUND: Perkinsus marinus, a protozoan parasite of the eastern oyster Crassostrea virginica, has devastated natural and farmed oyster populations along the Atlantic and Gulf coasts of the United States. It is classified as a member of the Perkinsozoa, a recently established phylum considered close to the ancestor of ciliates, dinoflagellates, and apicomplexans, and a key taxon for understanding unique adaptations (e.g. parasitism) within the Alveolata. Despite intense parasite pressure, no disease-resistant oysters have been identified and no effective therapies have been developed to date.

RESULTS: To gain insight into the biological basis of the parasite{\textquoteright}s virulence and pathogenesis mechanisms, and to identify genes encoding potential targets for intervention, we generated>31,000 5{\textquoteright} expressed sequence tags (ESTs) derived from four trophozoite libraries generated from two P. marinus strains. Trimming and clustering of the sequence tags yielded 7,863 unique sequences, some of which carry a spliced leader. Similarity searches revealed that 55\% of these had hits in protein sequence databases, of which 1,729 had their best hit with proteins from the chromalveolates (E-value

CONCLUSIONS: Our transcriptome analysis of P. marinus, the first for any member of the Perkinsozoa, contributes new insight into its biology and taxonomic position. It provides a very informative, albeit preliminary, glimpse into the expression of genes encoding functionally relevant proteins as potential targets for chemotherapy, and evidence for the presence of a relict plastid. Further, although P. marinus sequences display significant similarity to those from both apicomplexans and dinoflagellates, the presence of trans-spliced transcripts confirms the previously established affinities with the latter. The EST analysis reported herein, together with the recently completed sequence of the P. marinus genome and the development of transfection methodology, should result in improved intervention strategies against dermo disease.

}, keywords = {Alveolata, Animals, Expressed Sequence Tags, Ostreidae, Phylogeny}, issn = {1471-2164}, doi = {10.1186/1471-2164-11-228}, author = {Joseph, Sandeep J and Fern{\'a}ndez-Robledo, Jos{\'e} A and Gardner, Malcolm J and El-Sayed, Najib M and Kuo, Chih-Horng and Schott, Eric J and Wang, Haiming and Kissinger, Jessica C and Vasta, Gerardo R} } @article {38121, title = {Assembly complexity of prokaryotic genomes using short reads}, journal = {BMC bioinformaticsBMC Bioinformatics}, volume = {11}, year = {2010}, publisher = {BioMed Central Ltd}, author = {Kingsford, Carl and Schatz, M. and M. Pop} } @article {38114, title = {Analysis of clonally related environmental Vibrio cholerae O1 El Tor isolated before 1992 from Varanasi, India reveals origin of SXT-ICEs belonging to O139 and O1 serogroups}, journal = {Environmental Microbiology ReportsEnvironmental Microbiology Reports}, volume = {2}, year = {2009}, type = {10.1111/j.1758-2229.2009.00051.x}, abstract = {In this study, we report the presence of SXT in environmental Vibrio cholerae O1 El Tor strains isolated before 1992 from Varanasi, India. All isolates, except one, were resistant to Tm, and/or Sul, Sm, Fr, Na and Am. None contained plasmids. PCR and DNA sequencing revealed the presence of SXT containing dfrA1 and/or sulII, strAB in six isolates and dfr18, sulII and strAB in five isolates. Three clinical V. cholerae O1 isolated during 1992 contained the antibiotic resistance gene cassette aadA1 in the class 1 integron. Conjugation experiments, followed by PCR analysis of transconjugants, provided evidence of the transferable nature of SXT and associated antibiotic resistance genes, and its integration into the prfC site. Results of phylogenetic analysis of the intSXT gene of clonally similar V. cholerae showed a clear difference between dfr18+ and dfrA1+V. cholerae O1 isolates. This is the first report of the occurrence of SXT harbouring sulII, strAB, dfr18 and/or dfrA1 genes in environmental V. cholerae O1 isolated prior to 1992 from Varanasi, India, and suggests emergence of SXT+ antibiotic-resistant V. cholerae O139 and O1 from an environmental V. cholerae progenitor by acquisition of SXT and antibiotic-resistant gene clusters.}, isbn = {1758-2229}, author = {Mohapatra, Saswat S. and Mantri, Chinmay K. and Mohapatra, Harapriya and Rita R. Colwell and Singh, Durg V.} } @article {38120, title = {ARDB--Antibiotic Resistance Genes Database}, journal = {Nucleic Acids ResearchNucleic Acids Research}, volume = {37}, year = {2009}, type = {10.1093/nar/gkn656}, abstract = {The treatment of infections is increasingly compromised by the ability of bacteria to develop resistance to antibiotics through mutations or through the acquisition of resistance genes. Antibiotic resistance genes also have the potential to be used for bio-terror purposes through genetically modified organisms. In order to facilitate the identification and characterization of these genes, we have created a manually curated database{\textemdash}the Antibiotic Resistance Genes Database (ARDB){\textemdash}unifying most of the publicly available information on antibiotic resistance. Each gene and resistance type is annotated with rich information, including resistance profile, mechanism of action, ontology, COG and CDD annotations, as well as external links to sequence and protein databases. Our database also supports sequence similarity searches and implements an initial version of a tool for characterizing common mutations that confer antibiotic resistance. The information we provide can be used as compendium of antibiotic resistance factors as well as to identify the resistance genes of newly sequenced genes, genomes, or metagenomes. Currently, ARDB contains resistance information for 13 293 genes, 377 types, 257 antibiotics, 632 genomes, 933 species and 124 genera. ARDB is available at http://ardb.cbcb.umd.edu/.}, isbn = {0305-1048, 1362-4962}, author = {Liu, B. and M. Pop} } @article {49645, title = {Assessing Student Understanding of Host Pathogen Interactions Using a Concept Inventory}, journal = {J. Microbiol. Biol. Ed.}, volume = {10}, year = {2009}, pages = {43-50}, author = {Marbach-Ad, G. and Briken, V. and El-Sayed, N.M. and Frauwirth, K. and Fredericksen, B. and Hutcheson, S. and Gao, L.-Y. and Joseph, S. and Lee, V. and McIver, K.S. and Mosser, D. and Quimby, B.B. and Shields, P. and Song, W. and Stein, D.C. and Yuan, R.T. and Smith, A.C.} } @article {49835, title = {Automated classification of bird and amphibian calls using machine learning: A comparison of methods}, journal = {Ecological Informatics}, volume = {4}, year = {2009}, month = {Jan-09-2009}, pages = {206 - 214}, issn = {15749541}, doi = {10.1016/j.ecoinf.2009.06.005}, url = {http://linkinghub.elsevier.com/retrieve/pii/S1574954109000351http://api.elsevier.com/content/article/PII:S1574954109000351?httpAccept=text/xmlhttp://api.elsevier.com/content/article/PII:S1574954109000351?httpAccept=text/plain}, author = {Acevedo, Miguel A. and Corrada-Bravo, Carlos J. and Corrada-Bravo, Hector and Villanueva-Rivera, Luis J. and Aide, T. Mitchell} } @book {38108, title = {Algorithms in Bioinformatics: 7th International Workshop, WABI 2007, Philadelphia, PA, USA, September 8-9, 2007, Proceedings}, volume = {4645}, year = {2007}, publisher = {Springer}, organization = {Springer}, author = {Giancarlo, R. and Sridhar Hannenhalli} } @article {49852, title = {Analyzing patterns of microbial evolution using the mauve genome alignment system}, journal = {Comparative Genomics}, year = {2007}, pages = {135{\textendash}152}, author = {Darling, Aaron E and Todd Treangen and Messeguer, Xavier and Perna, Nicole T} } @article {38123, title = {Association of Vibrio Cholerae O1 El Tor and O139 Bengal with the Copepods Acartia Tonsa and Eurytemora Affinis}, journal = {Applied and Environmental MicrobiologyAppl. Environ. Microbiol.Applied and Environmental MicrobiologyAppl. Environ. Microbiol.}, volume = {73}, year = {2007}, type = {10.1128/AEM.01238-07}, abstract = {The association of Vibrio cholerae with zooplankton has been suggested as an important factor in transmission of human epidemic cholera, and the ability to colonize zooplankton surfaces may play a role in the temporal variation and predominance of the two different serogroups (V. cholerae O1 El Tor and O139) in the aquatic environment. To date, interactions between specific serogroups and species of plankton remain poorly understood. Laboratory microcosm experiments were carried out to compare quantitatively the colonization of two copepod species, Acartia tonsa and Eurytemora affinis, by each of the epidemic serogroups. V. cholerae O1 consistently achieved higher abundances than V. cholerae O139 in colonizing adults of each copepod species as well as the multiple life stages of E. affinis. This difference in colonization may be significant in the general predominance of V. cholerae O1 in cholera epidemics in rural Bangladesh where water supplies are taken directly from the environment.}, isbn = {0099-2240, 1098-5336}, author = {Rawlings, Tonya K. and Ruiz, Gregory M. and Rita R. Colwell} } @article {49641, title = {Analysis of fat body transcriptome from the adult tsetse fly, Glossina morsitans morsitans.}, journal = {Insect Mol Biol}, volume = {15}, year = {2006}, month = {2006 Aug}, pages = {411-24}, abstract = {

Tsetse flies (Diptera: Glossinidia) are vectors of pathogenic African trypanosomes. To develop a foundation for tsetse physiology, a normalized expressed sequence tag (EST) library was constructed from fat body tissue of immune-stimulated Glossina morsitans morsitans. Analysis of 20,257 high-quality ESTs yielded 6372 unique genes comprised of 3059 tentative consensus (TC) sequences and 3313 singletons (available at http://aksoylab.yale.edu). We analysed the putative fat body transcriptome based on homology to other gene products with known functions available in the public domain. In particular, we describe the immune-related products, reproductive function related yolk proteins and milk-gland protein, iron metabolism regulating ferritins and transferrin, and tsetse{\textquoteright}s major energy source proline biosynthesis. Expression analysis of the three yolk proteins indicates that all are detected in females, while only the yolk protein with similarity to lipases, is expressed in males. Milk gland protein, apparently important for larval nutrition, however, is primarily synthesized by accessory milk gland tissue.

}, keywords = {Adipose Tissue, Animals, Base Sequence, Computational Biology, DNA Primers, Egg Proteins, Expressed Sequence Tags, Female, Gene Expression Profiling, Insect Vectors, Male, Molecular Sequence Data, Reverse Transcriptase Polymerase Chain Reaction, Sequence Analysis, DNA, Sex Factors, Tsetse Flies}, issn = {0962-1075}, doi = {10.1111/j.1365-2583.2006.00649.x}, author = {Attardo, G M and Strickler-Dinglasan, P and Perkin, S A H and Caler, E and Bonaldo, M F and Soares, M B and El-Sayeed, N and Aksoy, S} } @proceedings {38100, title = {Abstracting workflows: unifying bioinformatics task conceptualization and specification through Semantic Web services}, year = {2004}, month = {2004}, address = {Cambridge, Massachusetts USA}, author = {Hashmi, N. and Lee, S. and Michael P. Cummings} } @article {38103, title = {Acinetobacter lipases: molecular biology, biochemical properties and biotechnological potential}, journal = {Journal of industrial microbiology \& biotechnologyJournal of industrial microbiology \& biotechnology}, volume = {31}, year = {2004}, type = {10.1007/s10295-004-0167-0}, abstract = {Lipases (EC 3.1.1.3) have received increased attention recently, evidenced by the increasing amount of information about lipases in the current literature. The renewed interest in this enzyme class is due primarily to investigations of their role in pathogenesis and their increasing use in biotechnological applications [38]. Also, many microbial lipases are available as commercial products, the majority of which are used in detergents, cosmetic production, food flavoring, and organic synthesis. Lipases are valued biocatalysts because they act under mild conditions, are highly stable in organic solvents, show broad substrate specificity, and usually show high regio- and/or stereo-selectivity in catalysis. A number of lipolytic strains of Acinetobacter have been isolated from a variety of sources and their lipases possess many biochemical properties similar to those that have been developed for biotechnological applications. This review discusses the biology of lipase expression in Acinetobacter, with emphasis on those aspects relevant to potential biotechnology applications.}, author = {Snellman, E. A. and Rita R. Colwell} } @article {38104, title = {Advances in schistosome genomics}, journal = {Trends in ParasitologyTrends in Parasitology}, volume = {20}, year = {2004}, type = {16/j.pt.2004.02.002}, abstract = {In Spring 2004, the first draft of the 270~Mb genome of Schistosoma mansoni will be released. This sequence is based on the assembly and annotation of a >7.5-fold coverage, shotgun sequencing project. The key stages involved in the international collaborative efforts that have led to the generation of these sequencing data for the parasite S. mansoni are discussed here.}, isbn = {1471-4922}, author = {Najib M. El-Sayed and Bartholomeu, Daniella and Ivens, Alasdair and Johnston, David A. and LoVerde, Philip T.} } @article {38117, title = {Applying permutation tests to tree-based statistical models: extending the R package rpart}, volume = {2004-24}, year = {2004}, institution = {University of Maryland Institute for Advanced Computer Studies}, abstract = {Tree-based statistical models are useful for evaluating relationships between predictor and response variables and for generating predictions when the response is unknown. However, current methods of constructing tree-based models do not provide a probabilistic assessment of the models produced. Here we describe our work to use permutation tests to quantitatively estimate the probability of tree-based statistical models. We have extended the rpart (recursive partitioning) package of the R system for statistical data analysis. This extension, rpart.permutation, executes the permutations in parallel, using MPI (Message Passing Interface) to greatly decrease the time necessary to complete the analysis.}, author = {Michael P. Cummings and Myers, D. S. and Mangelson, M.} } @article {38116, title = {ANNUAL REVIEW \& FORECAST REPORTS-THE OCEANS: TO PROTECT AND TO PLOW}, journal = {Sea TechnologySea Technology}, volume = {44}, year = {2003}, author = {Rita R. Colwell} } @article {38112, title = {Analysis of 16S-23S rRNA intergenic spacer of Vibrio cholerae and Vibrio mimicus for detection of these species}, journal = {METHODS IN MOLECULAR BIOLOGYMETHODS IN MOLECULAR BIOLOGY}, volume = {179}, year = {2002}, type = {10.1385/1-59259-238-4:171}, author = {Chun, J. and Rivera, I. N. G. and Rita R. Colwell} } @article {38115, title = {Analysis of stage-specific gene expression in the bloodstream and the procyclic form of Trypanosoma brucei using a genomic DNA-microarray}, journal = {Molecular and Biochemical ParasitologyMolecular and Biochemical Parasitology}, volume = {123}, year = {2002}, type = {16/S0166-6851(02)00138-X}, abstract = {A microarray comprising 21[punctuation space]024 different PCR products spotted on glass slides was constructed for gene expression studies on Trypanosoma brucei. The arrayed fragments were generated from a T. brucei shotgun clone library, which had been prepared from randomly sheared and size-fractionated genomic DNA. For the identification of stage-specific gene activity, total RNA from in vitro cultures of the human, long slender form and the insect, procyclic form of the parasite was labelled and hybridised to the microarray. Approximately 75\% of the genomic fragments produced a signal and about 2\% exhibited significant differences between the transcript levels in the bloodstream and procyclic forms. A few results were confirmed by Northern blot analysis or reverse-transcription and PCR. Three hundred differentially regulated clones have been selected for sequencing. So far, of 33 clones that showed about 2-fold or more over-expression in bloodstream forms, 15 contained sequences similar to those of VSG expression sites and at least six others appeared non-protein-coding. Of 29 procyclic-specific clones, at least eight appeared not to be protein-coding. A surprisingly large proportion of known regulated genes was already identified in this small sample, and some new ones were found, illustrating the utility of genomic arrays.}, keywords = {Expression, Gene, Microarray, Regulation, Trypanosoma brucei}, isbn = {0166-6851}, author = {Diehl, Susanne and Diehl, Frank and Najib M. El-Sayed and Clayton, Christine and Hoheisel, J{\"o}rg D.} } @article {49629, title = {Analysis of stage-specific gene expression in the bloodstream and the procyclic form of Trypanosoma brucei using a genomic DNA-microarray.}, journal = {Mol Biochem Parasitol}, volume = {123}, year = {2002}, month = {2002 Aug 28}, pages = {115-23}, abstract = {

A microarray comprising 21,024 different PCR products spotted on glass slides was constructed for gene expression studies on Trypanosoma brucei. The arrayed fragments were generated from a T. brucei shotgun clone library, which had been prepared from randomly sheared and size-fractionated genomic DNA. For the identification of stage-specific gene activity, total RNA from in vitro cultures of the human, long slender form and the insect, procyclic form of the parasite was labelled and hybridised to the microarray. Approximately 75\% of the genomic fragments produced a signal and about 2\% exhibited significant differences between the transcript levels in the bloodstream and procyclic forms. A few results were confirmed by Northern blot analysis or reverse-transcription and PCR. Three hundred differentially regulated clones have been selected for sequencing. So far, of 33 clones that showed about 2-fold or more over-expression in bloodstream forms, 15 contained sequences similar to those of VSG expression sites and at least six others appeared non-protein-coding. Of 29 procyclic-specific clones, at least eight appeared not to be protein-coding. A surprisingly large proportion of known regulated genes was already identified in this small sample, and some new ones were found, illustrating the utility of genomic arrays.

}, keywords = {Animals, Blotting, Northern, Escherichia coli, Gene expression, Gene Expression Profiling, Genes, Protozoan, HUMANS, Life Cycle Stages, Molecular Sequence Data, Oligonucleotide Array Sequence Analysis, Polymerase Chain Reaction, Transcription, Genetic, Trypanosoma brucei brucei}, issn = {0166-6851}, author = {Diehl, Susanne and Diehl, Frank and El-Sayed, Najib M and Clayton, Christine and Hoheisel, J{\"o}rg D} } @article {38111, title = {Analysis and prediction of protein functional sub-types from protein sequence alignments}, year = {2001}, note = {EP Patent 1,096,411}, author = {Sridhar Hannenhalli and Russell, R. B.} } @article {38113, title = {Analysis of a donor gene region for a variant surface glycoprotein and its expression site in African trypanosomes}, journal = {Nucleic acids researchNucleic Acids Research}, volume = {29}, year = {2001}, author = {LaCount, D. J. and Najib M. El-Sayed and Kaul, S. and Wanless, D. and Turner, C. M. R. and Donelson, J. E.} } @conference {49569, title = {Automatically tracking and analyzing the behavior of live insect colonies}, booktitle = {the fifth international conferenceProceedings of the fifth international conference on Autonomous agents - AGENTS {\textquoteright}01}, year = {2001}, publisher = {ACM Press}, organization = {ACM Press}, address = {Montreal, Quebec, CanadaNew York, New York, USA}, isbn = {158113326X}, doi = {10.1145/37573510.1145/375735.376434}, url = {http://portal.acm.org/citation.cfm?doid=375735http://portal.acm.org/citation.cfm?doid=375735.376434}, author = {Balch, Tucker and Khan, Zia and Veloso, Manuela} } @article {38105, title = {The African trypanosome genome}, journal = {International Journal for ParasitologyInternational Journal for Parasitology}, volume = {30}, year = {2000}, type = {16/S0020-7519(00)00015-1}, abstract = {The haploid nuclear genome of the African trypanosome, Trypanosoma brucei, is about 35 Mb and varies in size among different trypanosome isolates by as much as 25\%. The nuclear DNA of this diploid organism is distributed among three size classes of chromosomes: the megabase chromosomes of which there are at least 11 pairs ranging from 1 Mb to more than 6 Mb (numbered I-XI from smallest to largest); several intermediate chromosomes of 200-900 kb and uncertain ploidy; and about 100 linear minichromosomes of 50-150 kb. Size differences of as much as four-fold can occur, both between the two homologues of a megabase chromosome pair in a specific trypanosome isolate and among chromosome pairs in different isolates. The genomic DNA sequences determined to date indicated that about 50\% of the genome is coding sequence. The chromosomal telomeres possess TTAGGG repeats and many, if not all, of the telomeres of the megabase and intermediate chromosomes are linked to expression sites for genes encoding variant surface glycoproteins (VSGs). The minichromosomes serve as repositories for VSG genes since some but not all of their telomeres are linked to unexpressed VSG genes. A gene discovery program, based on sequencing the ends of cloned genomic DNA fragments, has generated more than 20 Mb of discontinuous single-pass genomic sequence data during the past year, and the complete sequences of chromosomes I and II (about 1 Mb each) in T. brucei GUTat 10.1 are currently being determined. It is anticipated that the entire genomic sequence of this organism will be known in a few years. Analysis of a test microarray of 400 cDNAs and small random genomic DNA fragments probed with RNAs from two developmental stages of T. brucei demonstrates that the microarray technology can be used to identify batteries of genes differentially expressed during the various life cycle stages of this parasite.}, isbn = {0020-7519}, author = {Najib M. El-Sayed and Hegde, Priti and Quackenbush, John and Melville, Sara E. and Donelson, John E.} } @article {38110, title = {Analysis and prediction of functional sub-types from protein sequence alignments}, journal = {Journal of Molecular BiologyJournal of Molecular Biology}, volume = {303}, year = {2000}, type = {10.1006/jmbi.2000.4036}, abstract = {The increasing number and diversity of protein sequence families requires new methods to define and predict details regarding function. Here, we present a method for analysis and prediction of functional sub-types from multiple protein sequence alignments. Given an alignment and set of proteins grouped into sub-types according to some definition of function, such as enzymatic specificity, the method identifies positions that are indicative of functional differences by comparison of sub-type specific sequence profiles, and analysis of positional entropy in the alignment. Alignment positions with significantly high positional relative entropy correlate with those known to be involved in defining sub-types for nucleotidyl cyclases, protein kinases, lactate/malate dehydrogenases and trypsin-like serine proteases. We highlight new positions for these proteins that suggest additional experiments to elucidate the basis of specificity. The method is also able to predict sub-type for unclassified sequences. We assess several variations on a prediction method, and compare them to simple sequence comparisons. For assessment, we remove close homologues to the sequence for which a prediction is to be made (by a sequence identity above a threshold). This simulates situations where a protein is known to belong to a protein family, but is not a close relative of another protein of known sub-type. Considering the four families above, and a sequence identity threshold of 30 \%, our best method gives an accuracy of 96 \% compared to 80 \% obtained for sequence similarity and 74 \% for BLAST. We describe the derivation of a set of sub-type groupings derived from an automated parsing of alignments from PFAM and the SWISSPROT database, and use this to perform a large-scale assessment. The best method gives an average accuracy of 94 \% compared to 68 \% for sequence similarity and 79 \% for BLAST. We discuss implications for experimental design, genome annotation and the prediction of protein function and protein intra-residue distances.}, keywords = {prediction, protein function, protein structure, sequence alignment}, isbn = {0022-2836}, author = {Sridhar Hannenhalli and Russell, Robert B.} } @article {38106, title = {African trypanosomes have differentially expressed genes encoding homologues of the Leishmania GP63 surface protease}, journal = {Journal of Biological ChemistryJournal of Biological Chemistry}, volume = {272}, year = {1997}, author = {Najib M. El-Sayed and Donelson, J. E.} } @article {49695, title = {AT-AC introns: an ATtACk on dogma.}, journal = {Science}, volume = {271}, year = {1996}, month = {1996 Mar 22}, pages = {1690-2}, keywords = {Animals, Base Composition, Base Sequence, Consensus Sequence, HUMANS, Introns, Molecular Sequence Data, Mutation, RNA Precursors, RNA Splicing, RNA, Small Nuclear, Spliceosomes}, issn = {0036-8075}, author = {Mount, S M} } @article {49721, title = {Are snRNPs involved in splicing?}, journal = {Nature}, volume = {283}, year = {1980}, month = {1980 Jan 10}, pages = {220-4}, keywords = {Animals, Base Sequence, Cell Line, Chickens, Erythrocytes, HUMANS, Liver, Lupus Erythematosus, Systemic, Molecular Weight, Nucleic Acid Precursors, Nucleoproteins, Ribonucleoproteins, RNA, Heterogeneous Nuclear, Species Specificity}, issn = {0028-0836}, author = {Lerner, M R and Boyle, J A and Mount, S M and Wolin, S L and Steitz, J A} }