@article {743, title = {Deciphering Genomic Heterogeneity and the Internal Composition of Tumour Activities through a Hierarchical Factorisation Model}, journal = {Mathematics}, volume = {9}, year = {2021}, month = {Jan-11-2021}, pages = {2833}, doi = {10.3390/math9212833}, url = {https://www.mdpi.com/2227-7390/9/21/2833https://www.mdpi.com/2227-7390/9/21/2833/pdf}, author = {Carbonell-Caballero, Jos{\'e} and L{\'o}pez-Qu{\'\i}lez, Antonio and Conesa, David and Dopazo, Joaquin} } @article {403, title = {A comparison of mechanistic signaling pathway activity analysis methods.}, journal = {Brief Bioinform}, volume = {20}, year = {2019}, month = {2019 09 27}, pages = {1655-1668}, abstract = {

Understanding the aspects of cell functionality that account for disease mechanisms or drug modes of action is a main challenge for precision medicine. Classical gene-based approaches ignore the modular nature of most human traits, whereas conventional pathway enrichment approaches produce only illustrative results of limited practical utility. Recently, a family of new methods has emerged that change the focus from the whole pathways to the definition of elementary subpathways within them that have any mechanistic significance and to the study of their activities. Thus, mechanistic pathway activity (MPA) methods constitute a new paradigm that allows recoding poorly informative genomic measurements into cell activity quantitative values and relate them to phenotypes. Here we provide a review on the MPA methods available and explain their contribution to systems medicine approaches for addressing challenges in the diagnostic and treatment of complex diseases.

}, keywords = {Algorithms, Humans, Postmortem Changes, Signal Transduction, Systems biology, Transcriptome}, issn = {1477-4054}, doi = {10.1093/bib/bby040}, author = {Amadoz, Alicia and Hidalgo, Marta R and Cubuk, Cankut and Carbonell-Caballero, Jos{\'e} and Dopazo, Joaquin} } @article {422, title = {Differential metabolic activity and discovery of therapeutic targets using summarized metabolic pathway models.}, journal = {NPJ Syst Biol Appl}, volume = {5}, year = {2019}, month = {2019}, pages = {7}, abstract = {

In spite of the increasing availability of genomic and transcriptomic data, there is still a gap between the detection of perturbations in gene expression and the understanding of their contribution to the molecular mechanisms that ultimately account for the phenotype studied. Alterations in the metabolism are behind the initiation and progression of many diseases, including cancer. The wealth of available knowledge on metabolic processes can therefore be used to derive mechanistic models that link gene expression perturbations to changes in metabolic activity that provide relevant clues on molecular mechanisms of disease and drug modes of action (MoA). In particular, pathway modules, which recapitulate the main aspects of metabolism, are especially suitable for this type of modeling. We present Metabolizer, a web-based application that offers an intuitive, easy-to-use interactive interface to analyze differences in pathway metabolic module activities that can also be used for class prediction and in silico prediction of knock-out (KO) effects. Moreover, Metabolizer can automatically predict the optimal KO intervention for restoring a diseased phenotype. We provide different types of validations of some of the predictions made by Metabolizer. Metabolizer is a web tool that allows understanding molecular mechanisms of disease or the MoA of drugs within the context of the metabolism by using gene expression measurements. In addition, this tool automatically suggests potential therapeutic targets for individualized therapeutic interventions.

}, keywords = {Computational Biology, Computer Simulation, Drug discovery, Gene Regulatory Networks, Humans, Internet, Metabolic Networks and Pathways, Models, Biological, Neoplasms, Phenotype, Software, Transcriptome}, issn = {2056-7189}, doi = {10.1038/s41540-019-0087-2}, author = {Cubuk, Cankut and Hidalgo, Marta R and Amadoz, Alicia and Rian, Kinza and Salavert, Francisco and Pujana, Miguel A and Mateo, Francesca and Herranz, Carmen and Carbonell-Caballero, Jos{\'e} and Dopazo, Joaquin} } @article {397, title = {The effects of death and post-mortem cold ischemia on human tissue transcriptomes.}, journal = {Nat Commun}, volume = {9}, year = {2018}, month = {2018 02 13}, pages = {490}, abstract = {

Post-mortem tissues samples are a key resource for investigating patterns of gene expression. However, the processes triggered by death and the post-mortem interval (PMI) can significantly alter physiologically normal RNA levels. We investigate the impact of PMI on gene expression using data from multiple tissues of post-mortem donors obtained from the GTEx project. We find that many genes change expression over relatively short PMIs in a tissue-specific manner, but this potentially confounding effect in a biological analysis can be minimized by taking into account appropriate covariates. By comparing ante- and post-mortem blood samples, we identify the cascade of transcriptional events triggered by death of the organism. These events do not appear to simply reflect stochastic variation resulting from mRNA degradation, but active and ongoing regulation of transcription. Finally, we develop a model to predict the time since death from the analysis of the transcriptome of a few readily accessible tissues.

}, keywords = {Blood, Cold Ischemia, Death, Female, gene expression, Humans, Models, Biological, Postmortem Changes, RNA, Messenger, Stochastic Processes, Transcriptome}, issn = {2041-1723}, doi = {10.1038/s41467-017-02772-x}, author = {Ferreira, Pedro G and Mu{\~n}oz-Aguirre, Manuel and Reverter, Ferran and S{\'a} Godinho, Caio P and Sousa, Abel and Amadoz, Alicia and Sodaei, Reza and Hidalgo, Marta R and Pervouchine, Dmitri and Carbonell-Caballero, Jos{\'e} and Nurtdinov, Ramil and Breschi, Alessandra and Amador, Raziel and Oliveira, Patr{\'\i}cia and Cubuk, Cankut and Curado, Jo{\~a}o and Aguet, Fran{\c c}ois and Oliveira, Carla and Dopazo, Joaquin and Sammeth, Michael and Ardlie, Kristin G and Guig{\'o}, Roderic} } @article {405, title = {Gene Expression Integration into Pathway Modules Reveals a Pan-Cancer Metabolic Landscape.}, journal = {Cancer Res}, volume = {78}, year = {2018}, month = {2018 11 01}, pages = {6059-6072}, abstract = {

Metabolic reprogramming plays an important role in cancer development and progression and is a well-established hallmark of cancer. Despite its inherent complexity, cellular metabolism can be decomposed into functional modules that represent fundamental metabolic processes. Here, we performed a pan-cancer study involving 9,428 samples from 25 cancer types to reveal metabolic modules whose individual or coordinated activity predict cancer type and outcome, in turn highlighting novel therapeutic opportunities. Integration of gene expression levels into metabolic modules suggests that the activity of specific modules differs between cancers and the corresponding tissues of origin. Some modules may cooperate, as indicated by the positive correlation of their activity across a range of tumors. The activity of many metabolic modules was significantly associated with prognosis at a stronger magnitude than any of their constituent genes. Thus, modules may be classified as tumor suppressors and oncomodules according to their potential impact on cancer progression. Using this modeling framework, we also propose novel potential therapeutic targets that constitute alternative ways of treating cancer by inhibiting their reprogrammed metabolism. Collectively, this study provides an extensive resource of predicted cancer metabolic profiles and dependencies. Combining gene expression with metabolic modules identifies molecular mechanisms of cancer undetected on an individual gene level and allows discovery of new potential therapeutic targets. .

}, keywords = {Cell Line, Tumor, Cluster Analysis, Disease Progression, Gene Expression Profiling, Gene Expression Regulation, Neoplastic, Gene Regulatory Networks, Humans, Kaplan-Meier Estimate, Metabolome, mutation, Neoplasms, Oncogenes, Phenotype, Prognosis, RNA, Small Interfering, Sequence Analysis, RNA, Transcriptome, Treatment Outcome}, issn = {1538-7445}, doi = {10.1158/0008-5472.CAN-17-2705}, author = {Cubuk, Cankut and Hidalgo, Marta R and Amadoz, Alicia and Pujana, Miguel A and Mateo, Francesca and Herranz, Carmen and Carbonell-Caballero, Jos{\'e} and Dopazo, Joaquin} } @article {398, title = {Genomics of the origin and evolution of Citrus.}, journal = {Nature}, volume = {554}, year = {2018}, month = {2018 02 15}, pages = {311-316}, abstract = {

The genus Citrus, comprising some of the most widely cultivated fruit crops worldwide, includes an uncertain number of species. Here we describe ten natural citrus species, using genomic, phylogenetic and biogeographic analyses of 60 accessions representing diverse citrus germ plasms, and propose that citrus diversified during the late Miocene epoch through a rapid southeast Asian radiation that correlates with a marked weakening of the monsoons. A second radiation enabled by migration across the Wallace line gave rise to the Australian limes in the early Pliocene epoch. Further identification and analyses of hybrids and admixed genomes provides insights into the genealogy of major commercial cultivars of citrus. Among mandarins and sweet orange, we find an extensive network of relatedness that illuminates the domestication of these groups. Widespread pummelo admixture among these mandarins and its correlation with fruit size and acidity suggests a plausible role of pummelo introgression in the selection of palatable mandarins. This work provides a new evolutionary framework for the genus Citrus.

}, keywords = {Asia, Southeastern, Biodiversity, citrus, Crop Production, Evolution, Molecular, Genetic Speciation, Genome, Plant, Genomics, Haplotypes, Heterozygote, History, Ancient, Human Migration, Hybridization, Genetic, Phylogeny}, issn = {1476-4687}, doi = {10.1038/nature25447}, author = {Wu, Guohong Albert and Terol, Javier and Iba{\~n}ez, Victoria and L{\'o}pez-Garc{\'\i}a, Antonio and P{\'e}rez-Rom{\'a}n, Estela and Borred{\'a}, Carles and Domingo, Concha and Tadeo, Francisco R and Carbonell-Caballero, Jos{\'e} and Alonso, Roberto and Curk, Franck and Du, Dongliang and Ollitrault, Patrick and Roose, Mikeal L and Dopazo, Joaquin and Gmitter, Frederick G and Rokhsar, Daniel S and Talon, Manuel} } @article {404, title = {Models of cell signaling uncover molecular mechanisms of high-risk neuroblastoma and predict disease outcome.}, journal = {Biol Direct}, volume = {13}, year = {2018}, month = {2018 08 22}, pages = {16}, abstract = {

BACKGROUND: Despite the progress in neuroblastoma therapies the mortality of high-risk patients is still high (40-50\%) and the molecular basis of the disease remains poorly known. Recently, a mathematical model was used to demonstrate that the network regulating stress signaling by the c-Jun N-terminal kinase pathway played a crucial role in survival of patients with neuroblastoma irrespective of their MYCN amplification status. This demonstrates the enormous potential of computational models of biological modules for the discovery of underlying molecular mechanisms of diseases.

RESULTS: Since signaling is known to be highly relevant in cancer, we have used a computational model of the whole cell signaling network to understand the molecular determinants of bad prognostic in neuroblastoma. Our model produced a comprehensive view of the molecular mechanisms of neuroblastoma tumorigenesis and progression.

CONCLUSION: We have also shown how the activity of signaling circuits can be considered a reliable model-based prognostic biomarker.

REVIEWERS: This article was reviewed by Tim Beissbarth, Wenzhong Xiao and Joanna Polanska. For the full reviews, please go to the Reviewers{\textquoteright} comments section.

}, keywords = {Computational Biology, Gene Expression Regulation, Neoplastic, Humans, JNK Mitogen-Activated Protein Kinases, Models, Theoretical, Neuroblastoma, Signal Transduction}, issn = {1745-6150}, doi = {10.1186/s13062-018-0219-4}, author = {Hidalgo, Marta R and Amadoz, Alicia and Cubuk, Cankut and Carbonell-Caballero, Jos{\'e} and Dopazo, Joaquin} } @article {407, title = {The modular network structure of the mutational landscape of Acute Myeloid Leukemia.}, journal = {PLoS One}, volume = {13}, year = {2018}, month = {2018}, pages = {e0202926}, abstract = {

Acute myeloid leukemia (AML) is associated with the sequential accumulation of acquired genetic alterations. Although at diagnosis cytogenetic alterations are frequent in AML, roughly 50\% of patients present an apparently normal karyotype (NK), leading to a highly heterogeneous prognosis. Due to this significant heterogeneity, it has been suggested that different molecular mechanisms may trigger the disease with diverse prognostic implications. We performed whole-exome sequencing (WES) of tumor-normal matched samples of de novo AML-NK patients lacking mutations in NPM1, CEBPA or FLT3-ITD to identify new gene mutations with potential prognostic and therapeutic relevance to patients with AML. Novel candidate-genes, together with others previously described, were targeted resequenced in an independent cohort of 100 de novo AML patients classified in the cytogenetic intermediate-risk (IR) category. A mean of 4.89 mutations per sample were detected in 73 genes, 35 of which were mutated in more than one patient. After a network enrichment analysis, we defined a single in silico model and established a set of seed-genes that may trigger leukemogenesis in patients with normal karyotype. The high heterogeneity of gene mutations observed in AML patients suggested that a specific alteration could not be as essential as the interaction of deregulated pathways.

}, keywords = {Adult, Aged, Cytodiagnosis, Female, Gene Regulatory Networks, Genetic Association Studies, Genetic Heterogeneity, Humans, Karyotype, Leukemia, Myeloid, Acute, Male, Middle Aged, mutation, Neoplasm Proteins, Nucleophosmin, Prognosis, whole exome sequencing}, issn = {1932-6203}, doi = {10.1371/journal.pone.0202926}, author = {Ib{\'a}{\~n}ez, Mariam and Carbonell-Caballero, Jos{\'e} and Such, Esperanza and Garc{\'\i}a-Alonso, Luz and Liquori, Alessandro and L{\'o}pez-Pav{\'\i}a, Mar{\'\i}a and LLop, Marta and Alonso, Carmen and Barrag{\'a}n, Eva and G{\'o}mez-Segu{\'\i}, In{\'e}s and Neef, Alexander and Herv{\'a}s, David and Montesinos, Pau and Sanz, Guillermo and Sanz, Miguel Angel and Dopazo, Joaquin and Cervera, Jos{\'e}} } @article {434, title = {High throughput estimation of functional cell activities reveals disease mechanisms and predicts relevant clinical outcomes.}, journal = {Oncotarget}, volume = {8}, year = {2017}, month = {2017 Jan 17}, pages = {5160-5178}, abstract = {

Understanding the aspects of the cell functionality that account for disease or drug action mechanisms is a main challenge for precision medicine. Here we propose a new method that models cell signaling using biological knowledge on signal transduction. The method recodes individual gene expression values (and/or gene mutations) into accurate measurements of changes in the activity of signaling circuits, which ultimately constitute high-throughput estimations of cell functionalities caused by gene activity within the pathway. Moreover, such estimations can be obtained either at cohort-level, in case/control comparisons, or personalized for individual patients. The accuracy of the method is demonstrated in an extensive analysis involving 5640 patients from 12 different cancer types. Circuit activity measurements not only have a high diagnostic value but also can be related to relevant disease outcomes such as survival, and can be used to assess therapeutic interventions.

}, keywords = {Computational Biology, gene expression, Gene Regulatory Networks, Humans, mutation, Neoplasms, Precision Medicine, Sequence Analysis, RNA, Signal Transduction}, issn = {1949-2553}, doi = {10.18632/oncotarget.14107}, author = {Hidalgo, Marta R and Cubuk, Cankut and Amadoz, Alicia and Salavert, Francisco and Carbonell-Caballero, Jos{\'e} and Dopazo, Joaquin} } @article {388, title = {Reference genome assessment from a population scale perspective: an accurate profile of variability and noise.}, journal = {Bioinformatics}, volume = {33}, year = {2017}, month = {2017 Nov 15}, pages = {3511-3517}, abstract = {

Motivation: Current plant and animal genomic studies are often based on newly assembled genomes that have not been properly consolidated. In this scenario, misassembled regions can easily lead to false-positive findings. Despite quality control scores are included within genotyping protocols, they are usually employed to evaluate individual sample quality rather than reference sequence reliability. We propose a statistical model that combines quality control scores across samples in order to detect incongruent patterns at every genomic region. Our model is inherently robust since common artifact signals are expected to be shared between independent samples over misassembled regions of the genome.

Results: The reliability of our protocol has been extensively tested through different experiments and organisms with accurate results, improving state-of-the-art methods. Our analysis demonstrates synergistic relations between quality control scores and allelic variability estimators, that improve the detection of misassembled regions, and is able to find strong artifact signals even within the human reference assembly. Furthermore, we demonstrated how our model can be trained to properly rank the confidence of a set of candidate variants obtained from new independent samples.

Availability and implementation: This tool is freely available at http://gitlab.com/carbonell/ces.

Contact: jcarbonell.cipf@gmail.com or joaquin.dopazo@juntadeandalucia.es.

Supplementary information: Supplementary data are available at Bioinformatics online.

}, keywords = {Animals, Genetic Variation, Genome, Genomics, Genotype, Humans, Models, Statistical, Quality Control, Reproducibility of Results, Software}, issn = {1367-4811}, doi = {10.1093/bioinformatics/btx482}, url = {https://academic.oup.com/bioinformatics/article-lookup/doi/10.1093/bioinformatics/btx482}, author = {Carbonell-Caballero, Jos{\'e} and Amadoz, Alicia and Alonso, Roberto and Hidalgo, Marta R and Cubuk, Cankut and Conesa, David and L{\'o}pez-Qu{\'\i}lez, Antonio and Dopazo, Joaquin} } @article {1203, title = {Actionable pathways: interactive discovery of therapeutic targets using signaling pathway models.}, journal = {Nucleic acids research}, year = {2016}, month = {2016 May 2}, abstract = {The discovery of actionable targets is crucial for targeted therapies and is also a constituent part of the drug discovery process. The success of an intervention over a target depends critically on its contribution, within the complex network of gene interactions, to the cellular processes responsible for disease progression or therapeutic response. Here we present PathAct, a web server that predicts the effect that interventions over genes (inhibitions or activations that simulate knock-outs, drug treatments or over-expressions) can have over signal transmission within signaling pathways and, ultimately, over the cell functionalities triggered by them. PathAct implements an advanced graphical interface that provides a unique interactive working environment in which the suitability of potentially actionable genes, that could eventually become drug targets for personalized or individualized therapies, can be easily tested. The PathAct tool can be found at: http://pathact.babelomics.org.}, keywords = {actionable genes, Disease mechanism, drug action mechanism, Drug discovery, pathway analysis, personalized medicine, signalling, therapeutic targets}, issn = {1362-4962}, doi = {10.1093/nar/gkw369}, url = {http://nar.oxfordjournals.org/content/early/2016/05/02/nar.gkw369.full}, author = {Salavert, Francisco and Hidago, Marta R and Amadoz, Alicia and Cubuk, Cankut and Medina, Ignacio and Crespo, Daniel and Carbonell-Caballero, Jos{\'e} and Joaqu{\'\i}n Dopazo} } @article {453, title = {The Mutational Landscape of Acute Promyelocytic Leukemia Reveals an Interacting Network of Co-Occurrences and Recurrent Mutations.}, journal = {PLoS One}, volume = {11}, year = {2016}, month = {2016}, pages = {e0148346}, abstract = {

Preliminary Acute Promyelocytic Leukemia (APL) whole exome sequencing (WES) studies have identified a huge number of somatic mutations affecting more than a hundred different genes mainly in a non-recurrent manner, suggesting that APL is a heterogeneous disease with secondary relevant changes not yet defined. To extend our knowledge of subtle genetic alterations involved in APL that might cooperate with PML/RARA in the leukemogenic process, we performed a comprehensive analysis of somatic mutations in APL combining WES with sequencing of a custom panel of targeted genes by next-generation sequencing. To select a reduced subset of high confidence candidate driver genes, further in silico analysis were carried out. After prioritization and network analysis we found recurrent deleterious mutations in 8 individual genes (STAG2, U2AF1, SMC1A, USP9X, IKZF1, LYN, MYCBP2 and PTPN11) with a strong potential of being involved in APL pathogenesis. Our network analysis of multiple mutations provides a reliable approach to prioritize genes for additional analysis, improving our knowledge of the leukemogenesis interactome. Additionally, we have defined a functional module in the interactome of APL. The hypothesis is that the number, or the specific combinations, of mutations harbored in each patient might not be as important as the disturbance caused in biological key functions, triggered by several not necessarily recurrent mutations.

}, keywords = {Exome, Gene Regulatory Networks, Genome, Human, Humans, INDEL Mutation, Leukemia, Promyelocytic, Acute, mutation, Mutation Rate, Polymorphism, Single Nucleotide, Reproducibility of Results}, issn = {1932-6203}, doi = {10.1371/journal.pone.0148346}, author = {Ib{\'a}{\~n}ez, Mariam and Carbonell-Caballero, Jos{\'e} and Garc{\'\i}a-Alonso, Luz and Such, Esperanza and Jim{\'e}nez-Almaz{\'a}n, Jorge and Vidal, Enrique and Barrag{\'a}n, Eva and L{\'o}pez-Pav{\'\i}a, Mar{\'\i}a and LLop, Marta and Mart{\'\i}n, Iv{\'a}n and G{\'o}mez-Segu{\'\i}, In{\'e}s and Montesinos, Pau and Sanz, Miguel A and Dopazo, Joaquin and Cervera, Jos{\'e}} } @article {1225, title = {The pan-cancer pathological regulatory landscape.}, journal = {Scientific reports}, volume = {6}, year = {2016}, month = {2016 Dec 21}, pages = {39709}, abstract = {Dysregulation of the normal gene expression program is the cause of a broad range of diseases, including cancer. Detecting the specific perturbed regulators that have an effect on the generation and the development of the disease is crucial for understanding the disease mechanism and for taking decisions on efficient preventive and curative therapies. Moreover, detecting such perturbations at the patient level is even more important from the perspective of personalized medicine. We applied the Transcription Factor Target Enrichment Analysis, a method that detects the activity of transcription factors based on the quantification of the collective transcriptional activation of their targets, to a large collection of 5607 cancer samples covering eleven cancer types. We produced for the first time a comprehensive catalogue of altered transcription factor activities in cancer, a considerable number of them significantly associated to patient{\textquoteright}s survival. Moreover, we described several interesting TFs whose activity do not change substantially in the cancer with respect to the normal tissue but ultimately play an important role in patient prognostic determination, which suggest they might be promising therapeutic targets. An additional advantage of this method is that it allows obtaining personalized TF activity estimations for individual patients.}, issn = {2045-2322}, doi = {10.1038/srep39709}, url = {http://www.nature.com/articles/srep39709}, author = {Falco, Matias M and Bleda, Marta and Carbonell-Caballero, Jos{\'e} and Joaqu{\'\i}n Dopazo} } @article {435, title = {The pan-cancer pathological regulatory landscape}, journal = {Scientific Reports}, volume = {6}, year = {2016}, month = {Jan-12-2016}, doi = {10.1038/srep39709}, url = {http://www.nature.com/articles/srep39709http://www.nature.com/articles/srep39709.pdfhttp://www.nature.com/articles/srep39709.pdfhttp://www.nature.com/articles/srep39709}, author = {Falco, Matias M. and Bleda, Marta and Carbonell-Caballero, Jos{\'e} and Dopazo, Joaquin} } @article {1129, title = {Babelomics 5.0: functional interpretation for new generations of genomic data.}, journal = {Nucleic acids research}, volume = {43}, number = {W1}, year = {2015}, month = {2015 Apr 20}, pages = {W117-W121}, abstract = {Babelomics has been running for more than one decade offering a user-friendly interface for the functional analysis of gene expression and genomic data. Here we present its fifth release, which includes support for Next Generation Sequencing data including gene expression (RNA-seq), exome or genome resequencing. Babelomics has simplified its interface, being now more intuitive. Improved visualization options, such as a genome viewer as well as an interactive network viewer, have been implemented. New technical enhancements at both, client and server sides, makes the user experience faster and more dynamic. Babelomics offers user-friendly access to a full range of methods that cover: (i) primary data analysis, (ii) a variety of tests for different experimental designs and (iii) different enrichment and network analysis algorithms for the interpretation of the results of such tests in the proper functional context. In addition to the public server, local copies of Babelomics can be downloaded and installed. Babelomics is freely available at: http://www.babelomics.org.}, keywords = {babelomics, data integration, gene set analysis, interactome, network analysis, NGS, RNA-seq, Systems biology, transcriptomics}, issn = {1362-4962}, doi = {10.1093/nar/gkv384}, url = {http://nar.oxfordjournals.org/content/43/W1/W117}, author = {Alonso, Roberto and Salavert, Francisco and Garcia-Garcia, Francisco and Carbonell-Caballero, Jos{\'e} and Bleda, Marta and Garc{\'\i}a-Alonso, Luz and Sanchis-Juan, Alba and Perez-Gil, Daniel and Marin-Garcia, Pablo and S{\'a}nchez, Rub{\'e}n and Cubuk, Cankut and Hidalgo, Marta R and Amadoz, Alicia and Hernansaiz-Ballesteros, Rosa D and Alem{\'a}n, Alejandro and T{\'a}rraga, Joaqu{\'\i}n and Montaner, David and Medina, Ignacio and Dopazo, Joaquin} } @article {1132, title = {Combining tumor genome simulation with crowdsourcing to benchmark somatic single-nucleotide-variant detection.}, journal = {Nature methods}, year = {2015}, month = {2015 May 18}, abstract = {The detection of somatic mutations from cancer genome sequences is key to understanding the genetic basis of disease progression, patient survival and response to therapy. Benchmarking is needed for tool assessment and improvement but is complicated by a lack of gold standards, by extensive resource requirements and by difficulties in sharing personal genomic information. To resolve these issues, we launched the ICGC-TCGA DREAM Somatic Mutation Calling Challenge, a crowdsourced benchmark of somatic mutation detection algorithms. Here we report the BAMSurgeon tool for simulating cancer genomes and the results of 248 analyses of three in silico tumors created with it. Different algorithms exhibit characteristic error profiles, and, intriguingly, false positives show a trinucleotide profile very similar to one found in human tumors. Although the three simulated tumors differ in sequence contamination (deviation from normal cell sequence) and in subclonality, an ensemble of pipelines outperforms the best individual pipeline in all cases. BAMSurgeon is available at https://github.com/adamewing/bamsurgeon/.}, keywords = {cancer, NGS, variant calling}, issn = {1548-7105}, doi = {10.1038/nmeth.3407}, url = {http://www.nature.com/nmeth/journal/vaop/ncurrent/full/nmeth.3407.html}, author = {Ewing, Adam D and Houlahan, Kathleen E and Hu, Yin and Ellrott, Kyle and Caloian, Cristian and Yamaguchi, Takafumi N and Bare, J Christopher and P{\textquoteright}ng, Christine and Waggott, Daryl and Sabelnykova, Veronica Y and Kellen, Michael R and Norman, Thea C and Haussler, David and Friend, Stephen H and Stolovitzky, Gustavo and Margolin, Adam A and Stuart, Joshua M and Boutros, Paul C}, editor = {ICGC-TCGA DREAM Somatic Mutation Calling Challenge participants and Liu Xi and Ninad Dewal and Yu Fan and Wenyi Wang and David Wheeler and Andreas Wilm and Grace Hui Ting and Chenhao Li and Denis Bertrand and Niranjan Nagarajan and Qing-Rong Chen and Chih-Hao Hsu and Ying Hu and Chunhua Yan and Warren Kibbe and Daoud Meerzaman and Kristian Cibulskis and Mara Rosenberg and Louis Bergelson and Adam Kiezun and Amie Radenbaugh and Anne-Sophie Sertier and Anthony Ferrari and Laurie Tonton and Kunal Bhutani and Nancy F Hansen and Difei Wang and Lei Song and Zhongwu Lai and Liao, Yang and Shi, Wei and Carbonell-Caballero, Jos{\'e} and Joaqu{\'\i}n Dopazo and Cheryl C K Lau and Justin Guinney} } @article {1121, title = {A phylogenetic analysis of 34 chloroplast genomes elucidates the relationships between wild and domestic species within the genus Citrus.}, journal = {Molecular biology and evolution}, volume = {32}, number = {8}, year = {2015}, month = {2015 Apr 14}, pages = {2015-2035}, abstract = {Citrus genus includes some of the most important cultivated fruit trees worldwide. Despite being extensively studied because of its commercial relevance, the origin of cultivated citrus species and the history of its domestication still remain an open question. Here we present a phylogenetic analysis of the chloroplast genomes of 34 citrus genotypes which constitutes the most comprehensive and detailed study to date on the evolution and variability of the genus Citrus. A statistical model was used to estimate divergence times between the major citrus groups. Additionally, a complete map of the variability across the genome of different citrus species was produced, including single nucleotide variants, heteroplasmic positions, indels and large structural variants. The distribution of all these variants provided further independent support to the phylogeny obtained. An unexpected finding was the high level of heteroplasmy found in several of the analysed genomes. The use of the complete chloroplast DNA not only paves the way for a better understanding of the phylogenetic relationships within the Citrus genus, but also provides original insights into other elusive evolutionary processes such as chloroplast inheritance, heteroplasmy and gene selection.}, keywords = {chloroplast, citrus, Phylogeny, WGS}, issn = {1537-1719}, doi = {10.1093/molbev/msv082}, url = {http://mbe.oxfordjournals.org/content/early/2015/04/27/molbev.msv082.full}, author = {Carbonell-Caballero, Jos{\'e} and Alonso, Roberto and Iba{\~n}ez, Victoria and Terol, Javier and Talon, Manuel and Dopazo, Joaquin} } @article {494, title = {The role of the interactome in the maintenance of deleterious variability in human populations.}, journal = {Mol Syst Biol}, volume = {10}, year = {2014}, month = {2014 Sep 26}, pages = {752}, abstract = {

Recent genomic projects have revealed the existence of an unexpectedly large amount of deleterious variability in the human genome. Several hypotheses have been proposed to explain such an apparently high mutational load. However, the mechanisms by which deleterious mutations in some genes cause a pathological effect but are apparently innocuous in other genes remain largely unknown. This study searched for deleterious variants in the 1,000 genomes populations, as well as in a newly sequenced population of 252 healthy Spanish individuals. In addition, variants causative of monogenic diseases and somatic variants from 41 chronic lymphocytic leukaemia patients were analysed. The deleterious variants found were analysed in the context of the interactome to understand the role of network topology in the maintenance of the observed mutational load. Our results suggest that one of the mechanisms whereby the effect of these deleterious variants on the phenotype is suppressed could be related to the configuration of the protein interaction network. Most of the deleterious variants observed in healthy individuals are concentrated in peripheral regions of the interactome, in combinations that preserve their connectivity, and have a marginal effect on interactome integrity. On the contrary, likely pathogenic cancer somatic deleterious variants tend to occur in internal regions of the interactome, often with associated structural consequences. Finally, variants causative of monogenic diseases seem to occupy an intermediate position. Our observations suggest that the real pathological potential of a variant might be more a systems property rather than an intrinsic property of individual proteins.

}, keywords = {Alleles, Exome, Gene Library, Genetic Variation, Genetics, Population, Genome, Human, Genomics, Humans, Models, Genetic, mutation, Phenotype, Protein Conformation, Protein Interaction Maps, Sequence Analysis, DNA, Whites}, issn = {1744-4292}, doi = {10.15252/msb.20145222}, author = {Garc{\'\i}a-Alonso, Luz and Jim{\'e}nez-Almaz{\'a}n, Jorge and Carbonell-Caballero, Jos{\'e} and Vela-Boza, Alicia and Santoyo-L{\'o}pez, Javier and Anti{\v n}olo, Guillermo and Dopazo, Joaquin} } @article {483, title = {Sequencing and functional analysis of the genome of a nematode egg-parasitic fungus, Pochonia chlamydosporia.}, journal = {Fungal Genet Biol}, volume = {65}, year = {2014}, month = {2014 Apr}, pages = {69-80}, abstract = {

Pochonia chlamydosporia is a worldwide-distributed soil fungus with a great capacity to infect and destroy the eggs and kill females of plant-parasitic nematodes. Additionally, it has the ability to colonize endophytically roots of economically-important crop plants, thereby promoting their growth and eliciting plant defenses. This multitrophic behavior makes P. chlamydosporia a potentially useful tool for sustainable agriculture approaches. We sequenced and assembled \~{}41 Mb of P. chlamydosporia genomic DNA and predicted 12,122 gene models, of which many were homologous to genes of fungal pathogens of invertebrates and fungal plant pathogens. Predicted genes (65\%) were functionally annotated according to Gene Ontology, and 16\% of them found to share homology with genes in the Pathogen Host Interactions (PHI) database. The genome of this fungus is highly enriched in genes encoding hydrolytic enzymes, such as proteases, glycoside hydrolases and carbohydrate esterases. We used RNA-Seq technology in order to identify the genes expressed during endophytic behavior of P. chlamydosporia when colonizing barley roots. Functional annotation of these genes showed that hydrolytic enzymes and transporters are expressed during endophytism. This structural and functional analysis of the P. chlamydosporia genome provides a starting point for understanding the molecular mechanisms involved in the multitrophic lifestyle of this fungus. The genomic information provided here should also prove useful for enhancing the capabilities of this fungus as a biocontrol agent of plant-parasitic nematodes and as a plant growth-promoting organism.

}, keywords = {Animals, Ascomycota, Female, Gene Expression Regulation, Fungal, Gene ontology, Genome, Fungal, Hordeum, Host-Pathogen Interactions, Nematoda, Ovum, Phylogeny, Plant Roots, Sequence Analysis, DNA, Signal Transduction, Transcriptome}, issn = {1096-0937}, doi = {10.1016/j.fgb.2014.02.002}, author = {Larriba, Eduardo and Jaime, Mar{\'\i}a D L A and Carbonell-Caballero, Jos{\'e} and Conesa, Ana and Dopazo, Joaquin and Nislow, Corey and Mart{\'\i}n-Nieto, Jos{\'e} and Lopez-Llorca, Luis Vicente} }