@article{McEvoy01012009, author = {McEvoy, Brian P and Montgomery, Grant W and McRae, Allan F and Ripatti, Samuli and Perola, Markus and Spector, Tim D and Cherkas, Lynn and Ahmadi, Kourosh R and Boomsma, Dorret and Willemsen, Gonneke and Hottenga, Jouke Jan and Peterson, Nancy L and Magnusson, Patrik KE and Ohm Kyvik, Kirsten and Christensen, Kaare and Kaprio, Jaako and Heikkila, Kauko and Palotie, Aarno and Widen, Elisabeth and Muilu, Juha and Syvanen, Anne-Christine and Liljedahl, Ulrika and Hardiman, Orla and Cronin, Simon and Peltonen, Leena and Martin, Nicholas G and Visscher, Peter M}, title = {Geographical structure and differential natural selection amongst North European populations}, year = {2009}, doi = {10.1101/gr.083394.108}, elocation-id = {gr.083394.108}, abstract ={Population structure can provide novel insight into the human past and recognizing and correcting for such stratification is a practical concern in gene mapping by many association methodologies. We investigate these patterns, primarily through principal component (PC) analysis of whole genome SNP polymorphism, in 2099 individuals from populations of Northern European origin (Ireland, UK, Netherlands, Denmark, Sweden, Finland, Australia and HapMap European-American). The major trends (PC1 and PC2) demonstrate an ability to detect geographic substructure, even over a small area like the British Isles, and this information can then be applied to finely dissect the ancestry of the European-Australian and -American samples. They simultaneously point to the importance of considering population stratification in what might be considered a small homogenous region. There is evidence from FST based analysis of genic and non-genic SNPs that differential positive selection has operated across these populations despite their short divergence time and relatively similar geographic and environmental range. The pressure appears to have been focused on genes involved in immunity, perhaps reflecting response to infectious disease epidemic. Such an event may explain a striking selective sweep centered on the rs2508049-G allele, close to HLA-G gene on chromosome 6. Evidence of the sweep extends over 8Mb/3.5cM region. Overall the results illustrate the power of dense genotype and sample data to explore regional population variation, the events that have crafted it and their implications in both explaining disease prevalence and mapping these genes by association}, URL = {http://genome.cshlp.org/content/early/2009/03/05/gr.083394.108.abstract}, eprint = {http://genome.cshlp.org/content/early/2009/03/05/gr.083394.108.full.pdf+html}, journal = {Genome Research} }