Over the past two decades, microsatellite genotypes have provided the data for landmark studies of human population-genetic variation. However, the various microsatellite data sets have been prepared with different procedures and sets of markers, so that it has been difficult to synthesize available data for a comprehensive analysis. Here, we combine eight human population-genetic data sets at the 645 microsatellite loci they share in common, accounting for procedural differences in the production of the different data sets, to assemble a single data set containing 5795 individuals from 267 worldwide populations. We perform a systematic analysis of genetic relatedness, detecting 240 intra-population and 92 inter-population pairs of previously unidentified close relatives and proposing standardized subsets of unrelated individuals for use in future studies. We then augment the human data with a data set of 84 chimpanzees at the 246 loci they share in common with the human samples. Multidimensional scaling and neighbor-joining analyses of these data sets offer new insights into the structure of human populations and enable a comparison of genetic variation patterns in chimpanzees with those in humans. Our combined data sets are the largest of their kind reported to date and provide a resource for use in human population-genetic studies.
%0 Journal Article
%1 pemberton2013population
%A Pemberton, T J
%A Degiorgio, M
%A Rosenberg, N A
%D 2013
%J G3 (Bethesda)
%K datasets human_genome microsattelites
%N 5
%P 891-907
%R 10.1534/g3.113.005728
%T Population structure in a comprehensive genomic data set on human microsatellite variation
%U http://www.ncbi.nlm.nih.gov/pubmed/23550135
%V 3
%X Over the past two decades, microsatellite genotypes have provided the data for landmark studies of human population-genetic variation. However, the various microsatellite data sets have been prepared with different procedures and sets of markers, so that it has been difficult to synthesize available data for a comprehensive analysis. Here, we combine eight human population-genetic data sets at the 645 microsatellite loci they share in common, accounting for procedural differences in the production of the different data sets, to assemble a single data set containing 5795 individuals from 267 worldwide populations. We perform a systematic analysis of genetic relatedness, detecting 240 intra-population and 92 inter-population pairs of previously unidentified close relatives and proposing standardized subsets of unrelated individuals for use in future studies. We then augment the human data with a data set of 84 chimpanzees at the 246 loci they share in common with the human samples. Multidimensional scaling and neighbor-joining analyses of these data sets offer new insights into the structure of human populations and enable a comparison of genetic variation patterns in chimpanzees with those in humans. Our combined data sets are the largest of their kind reported to date and provide a resource for use in human population-genetic studies.
@article{pemberton2013population,
abstract = {Over the past two decades, microsatellite genotypes have provided the data for landmark studies of human population-genetic variation. However, the various microsatellite data sets have been prepared with different procedures and sets of markers, so that it has been difficult to synthesize available data for a comprehensive analysis. Here, we combine eight human population-genetic data sets at the 645 microsatellite loci they share in common, accounting for procedural differences in the production of the different data sets, to assemble a single data set containing 5795 individuals from 267 worldwide populations. We perform a systematic analysis of genetic relatedness, detecting 240 intra-population and 92 inter-population pairs of previously unidentified close relatives and proposing standardized subsets of unrelated individuals for use in future studies. We then augment the human data with a data set of 84 chimpanzees at the 246 loci they share in common with the human samples. Multidimensional scaling and neighbor-joining analyses of these data sets offer new insights into the structure of human populations and enable a comparison of genetic variation patterns in chimpanzees with those in humans. Our combined data sets are the largest of their kind reported to date and provide a resource for use in human population-genetic studies.},
added-at = {2013-06-19T01:49:21.000+0200},
author = {Pemberton, T J and Degiorgio, M and Rosenberg, N A},
biburl = {https://www.bibsonomy.org/bibtex/28dc38731ffe87d0c75a5a584c4e830e0/peter.ralph},
doi = {10.1534/g3.113.005728},
interhash = {0e60f2a9d6e0876d353bc51cea36f797},
intrahash = {8dc38731ffe87d0c75a5a584c4e830e0},
journal = {G3 (Bethesda)},
keywords = {datasets human_genome microsattelites},
number = 5,
pages = {891-907},
pmid = {23550135},
timestamp = {2013-06-19T01:49:21.000+0200},
title = {Population structure in a comprehensive genomic data set on human microsatellite variation},
url = {http://www.ncbi.nlm.nih.gov/pubmed/23550135},
volume = 3,
year = 2013
}