@article{Chen01072014, author = {Chen, Zhen-Xia and Sturgill, David and Qu, Jiaxin and Jiang, Huaiyang and Park, Soo and Boley, Nathan and Suzuki, Ana Maria and Fletcher, Anthony R. and Plachetzki, David C. and FitzGerald, Peter C. and Artieri, Carlo G. and Atallah, Joel and Barmina, Olga and Brown, James B. and Blankenburg, Kerstin P. and Clough, Emily and Dasgupta, Abhijit and Gubbala, Sai and Han, Yi and Jayaseelan, Joy C. and Kalra, Divya and Kim, Yoo-Ah and Kovar, Christie L. and Lee, Sandra L. and Li, Mingmei and Malley, James D. and Malone, John H. and Mathew, Tittu and Mattiuzzo, Nicolas R. and Munidasa, Mala and Muzny, Donna M. and Ongeri, Fiona and Perales, Lora and Przytycka, Teresa M. and Pu, Ling-Ling and Robinson, Garrett and Thornton, Rebecca L. and Saada, Nehad and Scherer, Steven E. and Smith, Harold E. and Vinson, Charles and Warner, Crystal B. and Worley, Kim C. and Wu, Yuan-Qing and Zou, Xiaoyan and Cherbas, Peter and Kellis, Manolis and Eisen, Michael B. and Piano, Fabio and Kionte, Karin and Fitch, David H. and Sternberg, Paul W. and Cutter, Asher D. and Duff, Michael O. and Hoskins, Roger A. and Graveley, Brenton R. and Gibbs, Richard A. and Bickel, Peter J. and Kopp, Artyom and Carninci, Piero and Celniker, Susan E. and Oliver, Brian and Richards, Stephen}, title = {Comparative validation of the D. melanogaster modENCODE transcriptome annotation}, volume = {24}, number = {7}, pages = {1209-1223}, year = {2014}, doi = {10.1101/gr.159384.113}, abstract ={Accurate gene model annotation of reference genomes is critical for making them useful. The modENCODE project has improved the D. melanogaster genome annotation by using deep and diverse high-throughput data. Since transcriptional activity that has been evolutionarily conserved is likely to have an advantageous function, we have performed large-scale interspecific comparisons to increase confidence in predicted annotations. To support comparative genomics, we filled in divergence gaps in the Drosophila phylogeny by generating draft genomes for eight new species. For comparative transcriptome analysis, we generated mRNA expression profiles on 81 samples from multiple tissues and developmental stages of 15 Drosophila species, and we performed cap analysis of gene expression in D. melanogaster and D. pseudoobscura. We also describe conservation of four distinct core promoter structures composed of combinations of elements at three positions. Overall, each type of genomic feature shows a characteristic divergence rate relative to neutral models, highlighting the value of multispecies alignment in annotating a target genome that should prove useful in the annotation of other high priority genomes, especially human and other mammalian genomes that are rich in noncoding sequences. We report that the vast majority of elements in the annotation are evolutionarily conserved, indicating that the annotation will be an important springboard for functional genetic testing by the Drosophila community.}, URL = {http://genome.cshlp.org/content/24/7/1209.abstract}, eprint = {http://genome.cshlp.org/content/24/7/1209.full.pdf+html}, journal = {Genome Research} }