@misc{9894,
  author       = {Sigalova, Olga M. and Chaplin, Andrei V. and Bochkareva, Olga and Shelyakin, Pavel V. and Filaretov, Vsevolod A. and Akkuratov, Evgeny E. and Burskaia, Valentina and Gelfand, Mikhail S.},
  title        = {{Additional file 18 of Chlamydia pan-genomic analysis reveals balance between host adaptation and selective pressure to genome reduction}},
  year         = {2019},
  publisher    = {Springer Nature},
  doi          = {10.6084/m9.figshare.9808826.v1},
  abstract     = {Orthologous families (OFs) derived by MCL clustering of OGs. (CSV 189 kb)},
}

@misc{9895,
  author       = {Sigalova, Olga M. and Chaplin, Andrei V. and Bochkareva, Olga and Shelyakin, Pavel V. and Filaretov, Vsevolod A. and Akkuratov, Evgeny E. and Burskaia, Valentina and Gelfand, Mikhail S.},
  title        = {{Additional file 19 of Chlamydia pan-genomic analysis reveals balance between host adaptation and selective pressure to genome reduction}},
  year         = {2019},
  publisher    = {Springer Nature},
  doi          = {10.6084/m9.figshare.9808835.v1},
  abstract     = {Additional information on proteins from OG1. (CSV 30 kb)},
}

@misc{9896,
  author       = {Sigalova, Olga M. and Chaplin, Andrei V. and Bochkareva, Olga and Shelyakin, Pavel V. and Filaretov, Vsevolod A. and Akkuratov, Evgeny E. and Burskaia, Valentina and Gelfand, Mikhail S.},
  title        = {{Additional file 1 of Chlamydia pan-genomic analysis reveals balance between host adaptation and selective pressure to genome reduction}},
  year         = {2019},
  publisher    = {Springer Nature},
  doi          = {10.6084/m9.figshare.9808841.v1},
  abstract     = {Summary of the analysed genomes. (CSV 24 kb)},
}

@article{6898,
  author       = {Sigalova, Olga M. and Chaplin, Andrei V. and Bochkareva, Olga and Shelyakin, Pavel V. and Filaretov, Vsevolod A. and Akkuratov, Evgeny E. and Burskaia, Valentina and Gelfand, Mikhail S.},
  title        = {{Chlamydia pan-genomic analysis reveals balance between host adaptation and selective pressure to genome reduction}},
  journal      = {BMC Genomics},
  volume       = {20},
  number       = {1},
  year         = {2019},
  publisher    = {BioMed Central},
  issn         = {1471-2164},
  doi          = {10.1186/s12864-019-6059-5},
  abstract     = {Background: Chlamydia are ancient intracellular pathogens with reduced, though strikingly conserved genome. Despite their parasitic lifestyle and isolated intracellular environment, these bacteria managed to avoid accumulation of deleterious mutations leading to subsequent genome degradation characteristic for many parasitic bacteria. Results: We report pan-genomic analysis of sixteen species from genus Chlamydia including identification and functional annotation of orthologous genes, and characterization of gene gains, losses, and rearrangements. We demonstrate the overall genome stability of these bacteria as indicated by a large fraction of common genes with conserved genomic locations. On the other hand, extreme evolvability is confined to several paralogous gene families such as polymorphic membrane proteins and phospholipase D, and likely is caused by the pressure from the host immune system. Conclusions: This combination of a large, conserved core genome and a small, evolvable periphery likely reflect the balance between the selective pressure towards genome reduction and the need to adapt to escape from the host immunity.},
}

@misc{9898,
  author       = {Sigalova, Olga M. and Chaplin, Andrei V. and Bochkareva, Olga and Shelyakin, Pavel V. and Filaretov, Vsevolod A. and Akkuratov, Evgeny E. and Burskaia, Valentina and Gelfand, Mikhail S.},
  title        = {{Additional file 21 of Chlamydia pan-genomic analysis reveals balance between host adaptation and selective pressure to genome reduction}},
  year         = {2019},
  publisher    = {Springer Nature},
  doi          = {10.6084/m9.figshare.9808859.v1},
  abstract     = {All polyN tracts of length 5 or more nucleotides in sequences of genes from OG1. Sequences were extracted and scanned prior to automatic correction for frameshifts implemented in the RAST pipeline. (CSV 133 kb)},
}

@misc{9897,
  author       = {Sigalova, Olga M. and Chaplin, Andrei V. and Bochkareva, Olga and Shelyakin, Pavel V. and Filaretov, Vsevolod A. and Akkuratov, Evgeny E. and Burskaia, Valentina and Gelfand, Mikhail S.},
  title        = {{Additional file 20 of Chlamydia pan-genomic analysis reveals balance between host adaptation and selective pressure to genome reduction}},
  year         = {2019},
  publisher    = {Springer Nature},
  doi          = {10.6084/m9.figshare.9808850.v1},
  abstract     = {Frameshift and nonsense mutations near homopolymeric tracts of OG1 genes. Only 374 genes with typical length and domain composition were considered. (CSV 6 kb)},
}

@misc{9901,
  author       = {Sigalova, Olga M. and Chaplin, Andrei V. and Bochkareva, Olga and Shelyakin, Pavel V. and Filaretov, Vsevolod A. and Akkuratov, Evgeny E. and Burskaia, Valentina and Gelfand, Mikhail S.},
  title        = {{Additional file 9 of Chlamydia pan-genomic analysis reveals balance between host adaptation and selective pressure to genome reduction}},
  year         = {2019},
  publisher    = {Springer Nature},
  doi          = {10.6084/m9.figshare.9808907.v1},
  abstract     = {Clusters of Orthologous Genes (COGs) and corresponding functional categories assigned to OGs. (CSV 117 kb)},
}

@misc{9899,
  author       = {Sigalova, Olga M. and Chaplin, Andrei V. and Bochkareva, Olga and Shelyakin, Pavel V. and Filaretov, Vsevolod A. and Akkuratov, Evgeny E. and Burskaia, Valentina and Gelfand, Mikhail S.},
  title        = {{Additional file 2 of Chlamydia pan-genomic analysis reveals balance between host adaptation and selective pressure to genome reduction}},
  year         = {2019},
  publisher    = {Springer Nature},
  doi          = {10.6084/m9.figshare.9808865.v1},
  abstract     = {Summary of orthologous groups (OGs) for 227 genomes of genus Chlamydia. (CSV 362 kb)},
}

@misc{9900,
  author       = {Sigalova, Olga M. and Chaplin, Andrei V. and Bochkareva, Olga and Shelyakin, Pavel V. and Filaretov, Vsevolod A. and Akkuratov, Evgeny E. and Burskaia, Valentina and Gelfand, Mikhail S.},
  title        = {{Additional file 5 of Chlamydia pan-genomic analysis reveals balance between host adaptation and selective pressure to genome reduction}},
  year         = {2019},
  publisher    = {Springer Nature},
  doi          = {10.6084/m9.figshare.9808886.v1},
  abstract     = {Pan-genome statistics by species. (CSV 3 kb)},
}

@article{6419,
  author       = {Pokusaeva, Victoria and Usmanova, Dinara R. and Putintseva, Ekaterina V. and Espinar, Lorena and Sarkisyan, Karen and Mishin, Alexander S. and Bogatyreva, Natalya S. and Ivankov, Dmitry and Akopyan, Arseniy and Avvakumov, Sergey and Povolotskaya, Inna S. and Filion, Guillaume J. and Carey, Lucas B. and Kondrashov, Fyodor},
  title        = {{An experimental assay of the interactions of amino acids from orthologous sequences shaping a complex fitness landscape}},
  journal      = {PLoS Genetics},
  volume       = {15},
  number       = {4},
  year         = {2019},
  publisher    = {Public Library of Science},
  issn         = {1553-7404},
  doi          = {10.1371/journal.pgen.1008079},
  abstract     = {Characterizing the fitness landscape, a representation of fitness for a large set of genotypes, is key to understanding how genetic information is interpreted to create functional organisms. Here we determined the evolutionarily-relevant segment of the fitness landscape of His3, a gene coding for an enzyme in the histidine synthesis pathway, focusing on combinations of amino acid states found at orthologous sites of extant species. Just 15% of amino acids found in yeast His3 orthologues were always neutral while the impact on fitness of the remaining 85% depended on the genetic background. Furthermore, at 67% of sites, amino acid replacements were under sign epistasis, having both strongly positive and negative effect in different genetic backgrounds. 46% of sites were under reciprocal sign epistasis. The fitness impact of amino acid replacements was influenced by only a few genetic backgrounds but involved interaction of multiple sites, shaping a rugged fitness landscape in which many of the shortest paths between highly fit genotypes are inaccessible.},
}

@misc{9790,
  author       = {Pokusaeva, Victoria and Usmanova, Dinara R. and Putintseva, Ekaterina V. and Espinar, Lorena and Sarkisyan, Karen and Mishin, Alexander S. and Bogatyreva, Natalya S. and Ivankov, Dmitry and Akopyan, Arseniy and Avvakumov, Sergey and Povolotskaya, Inna S. and Filion, Guillaume J. and Carey, Lucas B. and Kondrashov, Fyodor},
  title        = {{A statistical summary of segment libraries and sequencing results}},
  year         = {2019},
  publisher    = {Public Library of Science},
  doi          = {10.1371/journal.pgen.1008079.s011},
}

% NOTE(review): this record carries the same title and DOI as entry 9790 and
% looks like a duplicate of it -- confirm and drop one of the two. The author
% list below was completed with "Avvakumov, Sergey" so that it agrees with
% entry 9790 and with the parent article (entry 6419); verify against the source.
@misc{9797,
  author       = {Pokusaeva, Victoria and Usmanova, Dinara R. and Putintseva, Ekaterina V. and Espinar, Lorena and Sarkisyan, Karen and Mishin, Alexander S. and Bogatyreva, Natalya S. and Ivankov, Dmitry and Akopyan, Arseniy and Avvakumov, Sergey and Povolotskaya, Inna S. and Filion, Guillaume J. and Carey, Lucas B. and Kondrashov, Fyodor},
  title        = {{A statistical summary of segment libraries and sequencing results}},
  year         = {2019},
  publisher    = {Public Library of Science},
  doi          = {10.1371/journal.pgen.1008079.s011},
}

@misc{9789,
  author       = {Pokusaeva, Victoria and Usmanova, Dinara R. and Putintseva, Ekaterina V. and Espinar, Lorena and Sarkisyan, Karen and Mishin, Alexander S. and Bogatyreva, Natalya S. and Ivankov, Dmitry and Akopyan, Arseniy and Avvakumov, Sergey and Povolotskaya, Inna S. and Filion, Guillaume J. and Carey, Lucas B. and Kondrashov, Fyodor},
  title        = {{Multiple alignment of His3 orthologues}},
  year         = {2019},
  publisher    = {Public Library of Science},
  doi          = {10.1371/journal.pgen.1008079.s010},
}

@article{279,
  author       = {Zapata, Luis and Pich, Oriol and Serrano, Luis and Kondrashov, Fyodor and Ossowski, Stephan and Schaefer, Martin},
  title        = {{Negative selection in tumor genome evolution acts on essential cellular functions and the immunopeptidome}},
  journal      = {Genome Biology},
  volume       = {19},
  year         = {2018},
  publisher    = {BioMed Central},
  doi          = {10.1186/s13059-018-1434-0},
  abstract     = {Background: Natural selection shapes cancer genomes. Previous studies used signatures of positive selection to identify genes driving malignant transformation. However, the contribution of negative selection against somatic mutations that affect essential tumor functions or specific domains remains a controversial topic. Results: Here, we analyze 7546 individual exomes from 26 tumor types from TCGA data to explore the portion of the cancer exome under negative selection. Although we find most of the genes neutrally evolving in a pan-cancer framework, we identify essential cancer genes and immune-exposed protein regions under significant negative selection. Moreover, our simulations suggest that the amount of negative selection is underestimated. We therefore choose an empirical approach to identify genes, functions, and protein regions under negative selection. We find that expression and mutation status of negatively selected genes is indicative of patient survival. Processes that are most strongly conserved are those that play fundamental cellular roles such as protein synthesis, glucose metabolism, and molecular transport. Intriguingly, we observe strong signals of selection in the immunopeptidome and proteins controlling peptide exposition, highlighting the importance of immune surveillance evasion. Additionally, tumor type-specific immune activity correlates with the strength of negative selection on human epitopes. Conclusions: In summary, our results show that negative selection is a hallmark of cell essentiality and immune response in cancer. The functional domains identified could be exploited therapeutically, ultimately allowing for the development of novel cancer treatments.},
}

@misc{13059,
  author       = {Garriga, Edgar and di Tommaso, Paolo and Magis, Cedrik and Erb, Ionas and Mansouri, Leila and Baltzis, Athanasios and Laayouni, Hafid and Kondrashov, Fyodor and Floden, Evan and Notredame, Cedric},
  title        = {{Fast and accurate large multiple sequence alignments with a root-to-leaf regressive method}},
  year         = {2018},
  publisher    = {Zenodo},
  doi          = {10.5281/zenodo.2025846},
  abstract     = {This dataset contains a GitHub repository containing all the data, analysis, Nextflow workflows and Jupyter notebooks to replicate the manuscript titled "Fast and accurate large multiple sequence alignments with a root-to-leaf regressive method".
It also contains the Multiple Sequence Alignments (MSAs) generated as well as the main figures and tables from the manuscript.
The repository is also available at GitHub (https://github.com/cbcrg/dpa-analysis) release `v1.2`.
For details on how to use the regressive alignment algorithm, see the T-Coffee software suite (https://github.com/cbcrg/tcoffee).},
}

@misc{9811,
  author       = {Zapata, Luis and Pich, Oriol and Serrano, Luis and Kondrashov, Fyodor and Ossowski, Stephan and Schaefer, Martin},
  title        = {{Additional file 1: Of negative selection in tumor genome evolution acts on essential cellular functions and the immunopeptidome}},
  year         = {2018},
  publisher    = {Springer Nature},
  doi          = {10.6084/m9.figshare.6401390.v1},
  abstract     = {This document contains additional supporting evidence presented as supplemental tables. (XLSX 50 kb)},
}

@misc{9812,
  author       = {Zapata, Luis and Pich, Oriol and Serrano, Luis and Kondrashov, Fyodor and Ossowski, Stephan and Schaefer, Martin},
  title        = {{Additional file 2: Of negative selection in tumor genome evolution acts on essential cellular functions and the immunopeptidome}},
  year         = {2018},
  publisher    = {Springer Nature},
  doi          = {10.6084/m9.figshare.6401414.v1},
  abstract     = {This document contains the full list of genes with their respective significance and dN/dS values. (TXT 4499 kb)},
}

@article{5780,
  author       = {Kotlobay, Alexey A. and Sarkisyan, Karen and Mokrushina, Yuliana A. and Marcet-Houben, Marina and Serebrovskaya, Ekaterina O. and Markina, Nadezhda M. and Gonzalez Somermeyer, Louisa and Gorokhovatsky, Andrey Y. and Vvedensky, Andrey and Purtov, Konstantin V. and Petushkov, Valentin N. and Rodionova, Natalja S. and Chepurnyh, Tatiana V. and Fakhranurova, Liliia and Guglya, Elena B. and Ziganshin, Rustam and Tsarkova, Aleksandra S. and Kaskova, Zinaida M. and Shender, Victoria and Abakumov, Maxim and Abakumova, Tatiana O. and Povolotskaya, Inna S. and Eroshkin, Fedor M. and Zaraisky, Andrey G. and Mishin, Alexander S. and Dolgov, Sergey V. and Mitiouchkina, Tatiana Y. and Kopantzev, Eugene P. and Waldenmaier, Hans E. and Oliveira, Anderson G. and Oba, Yuichi and Barsova, Ekaterina and Bogdanova, Ekaterina A. and Gabaldón, Toni and Stevani, Cassius V. and Lukyanov, Sergey and Smirnov, Ivan V. and Gitelson, Josef I. and Kondrashov, Fyodor and Yampolsky, Ilia V.},
  title        = {{Genetically encodable bioluminescent system from fungi}},
  journal      = {Proceedings of the National Academy of Sciences of the United States of America},
  volume       = {115},
  number       = {50},
  pages        = {12728--12732},
  year         = {2018},
  publisher    = {National Academy of Sciences},
  issn         = {0027-8424},
  doi          = {10.1073/pnas.1803615115},
  abstract     = {Bioluminescence is found across the entire tree of life, conferring a spectacular set of visually oriented functions from attracting mates to scaring off predators. Half a dozen different luciferins, molecules that emit light when enzymatically oxidized, are known. However, just one biochemical pathway for luciferin biosynthesis has been described in full, which is found only in bacteria. Here, we report identification of the fungal luciferase and three other key enzymes that together form the biosynthetic cycle of the fungal luciferin from caffeic acid, a simple and widespread metabolite. Introduction of the identified genes into the genome of the yeast Pichia pastoris along with caffeic acid biosynthesis genes resulted in a strain that is autoluminescent in standard media. We analyzed evolution of the enzymes of the luciferin biosynthesis cycle and found that fungal bioluminescence emerged through a series of events that included two independent gene duplications. The retention of the duplicated enzymes of the luciferin pathway in nonluminescent fungi shows that the gene duplication was followed by functional sequence divergence of enzymes of at least one gene in the biosynthetic pathway and suggests that the evolution of fungal bioluminescence proceeded through several closely related stepping stone nonluminescent biochemical reactions with adaptive roles. The availability of a complete eukaryotic luciferin biosynthesis pathway provides several applications in biomedicine and bioengineering.},
}

@article{5995,
  author       = {Usmanova, Dinara R. and Bogatyreva, Natalya S. and Ariño Bernad, Joan and Eremina, Aleksandra A. and Gorshkova, Anastasiya A. and Kanevskiy, German M. and Lonishin, Lyubov R. and Meister, Alexander V. and Yakupova, Alisa G. and Kondrashov, Fyodor and Ivankov, Dmitry},
  title        = {{Self-consistency test reveals systematic bias in programs for prediction change of stability upon mutation}},
  journal      = {Bioinformatics},
  volume       = {34},
  number       = {21},
  pages        = {3653--3658},
  year         = {2018},
  publisher    = {Oxford University Press},
  issn         = {1367-4811},
  doi          = {10.1093/bioinformatics/bty340},
  abstract     = {Motivation: Computational prediction of the effect of mutations on protein stability is used by researchers in many fields. The utility of the prediction methods is affected by their accuracy and bias. Bias, a systematic shift of the predicted change of stability, has been noted as an issue for several methods, but has not been investigated systematically. Presence of the bias may lead to misleading results especially when exploring the effects of combination of different mutations. Results: Here we use a protocol to measure the bias as a function of the number of introduced mutations. It is based on a self-consistency test of the reciprocity the effect of a mutation. An advantage of the used approach is that it relies solely on crystal structures without experimentally measured stability values. We applied the protocol to four popular algorithms predicting change of protein stability upon mutation, FoldX, Eris, Rosetta and I-Mutant, and found an inherent bias. For one program, FoldX, we manage to substantially reduce the bias using additional relaxation by Modeller. Authors using algorithms for predicting effects of mutations should be aware of the bias described here.},
}

@article{384,
  author       = {Hönigschmid, Peter and Bykova, Nadya and Schneider, René and Ivankov, Dmitry and Frishman, Dmitrij},
  title        = {{Evolutionary interplay between symbiotic relationships and patterns of signal peptide gain and loss}},
  journal      = {Genome Biology and Evolution},
  volume       = {10},
  number       = {3},
  pages        = {928--938},
  year         = {2018},
  publisher    = {Oxford University Press},
  doi          = {10.1093/gbe/evy049},
  abstract     = {Can orthologous proteins differ in terms of their ability to be secreted? To answer this question, we investigated the distribution of signal peptides within the orthologous groups of Enterobacterales. Parsimony analysis and sequence comparisons revealed a large number of signal peptide gain and loss events, in which signal peptides emerge or disappear in the course of evolution. Signal peptide losses prevail over gains, an effect which is especially pronounced in the transition from the free-living or commensal to the endosymbiotic lifestyle. The disproportionate decline in the number of signal peptide-containing proteins in endosymbionts cannot be explained by the overall reduction of their genomes. Signal peptides can be gained and lost either by acquisition/elimination of the corresponding N-terminal regions or by gradual accumulation of mutations. The evolutionary dynamics of signal peptides in bacterial proteins represents a powerful mechanism of functional diversification.},
}

