@article{Hillier01091996, author = {Hillier, L D and Lennon, G and Becker, M and Bonaldo, M F and Chiapelli, B and Chissoe, S and Dietrich, N and DuBuque, T and Favello, A and Gish, W and Hawkins, M and Hultman, M and Kucaba, T and Lacy, M and Le, M and Le, N and Mardis, E and Moore, B and Morris, M and Parsons, J and Prange, C and Rifkin, L and Rohlfing, T and Schellenberg, K and Marra, M}, title = {Generation and analysis of 280,000 human expressed sequence tags.}, volume = {6}, number = {9}, pages = {807-828}, year = {1996}, doi = {10.1101/gr.6.9.807}, abstract ={We report the generation of 319,311 single-pass sequencing reactions (known as expressed sequence tags, or ESTs) obtained from the 5' and 3' ends of 194,031 human cDNA clones. Our goal has been to obtain tag sequences from many different genes and to deposit these in the publicly accessible Data Base for Expressed Sequence Tags. Highly efficient automatic screening of the data allows deposition of the annotated sequences without delay. Sequences have been generated from 26 oligo(dT) primed directionally cloned libraries, of which 18 were normalized. The libraries were constructed using mRNA isolated from 17 different tissues representing three developmental states. Comparisons of a subset of our data with nonredundant human mRNA and protein data bases show that the ESTs represent many known sequences and contain many that are novel. Analysis of protein families using Hidden Markov Models confirms this observation and supports the contention that although normalization reduces significantly the relative abundance of redundant cDNA clones, it does not result in the complete removal of members of gene families.}, URL = {http://genome.cshlp.org/content/6/9/807.abstract}, eprint = {http://genome.cshlp.org/content/6/9/807.full.pdf+html}, journal = {Genome Research} }