Widespread sharing of long, identical-by-descent (IBD) genetic segments is a
hallmark of populations that have experienced a recent bottleneck. The
detection of these IBD segments is now feasible, enabling a wide range of
applications from phasing and imputation to demographic inference. Here, we
study the distribution of IBD sharing in the Wright-Fisher model. Using
coalescent theory, we calculate the mean and variance of the total sharing
between arbitrary pairs of individuals. We then study the cohort-averaged
sharing: the average total sharing between one individual to the rest of the
cohort. We find that for large cohorts, the cohort-averaged sharing is
distributed approximately normally. Surprisingly, the variance of this
distribution remains large even for large cohorts, implying the existence of
"hyper-sharing" individuals. The presence of such individuals bears important
consequences to the design of sequencing studies, since, if they are selected
for whole-genome sequencing, a larger fraction of the cohort can be
subsequently imputed. We calculate the expected gain in power of imputation by
IBD, and subsequently, in power to detect an association, when individuals are
either randomly selected or are specifically the hyper-sharing individuals.
Finally, we study the distribution of pairwise sharing and cohort-averaged
sharing in the Ashkenazi Jewish population.
%0 Journal Article
%1 carmi2012variance
%A Carmi, Shai
%A Palamara, Pier Francesco
%A Vacic, Vladimir
%A Lencz, Todd
%A Darvasi, Ariel
%A Pe'er, Itsik
%D 2012
%J Genetics
%K IBD Wright-Fisher_model coalescent_theory
%R 10.1534/genetics.112.147215
%T The variance of identity-by-descent sharing in the Wright-Fisher model
%U http://arxiv.org/abs/1206.4745
%X Widespread sharing of long, identical-by-descent (IBD) genetic segments is a
hallmark of populations that have experienced a recent bottleneck. The
detection of these IBD segments is now feasible, enabling a wide range of
applications from phasing and imputation to demographic inference. Here, we
study the distribution of IBD sharing in the Wright-Fisher model. Using
coalescent theory, we calculate the mean and variance of the total sharing
between arbitrary pairs of individuals. We then study the cohort-averaged
sharing: the average total sharing between one individual to the rest of the
cohort. We find that for large cohorts, the cohort-averaged sharing is
distributed approximately normally. Surprisingly, the variance of this
distribution remains large even for large cohorts, implying the existence of
"hyper-sharing" individuals. The presence of such individuals bears important
consequences to the design of sequencing studies, since, if they are selected
for whole-genome sequencing, a larger fraction of the cohort can be
subsequently imputed. We calculate the expected gain in power of imputation by
IBD, and subsequently, in power to detect an association, when individuals are
either randomly selected or are specifically the hyper-sharing individuals.
Finally, we study the distribution of pairwise sharing and cohort-averaged
sharing in the Ashkenazi Jewish population.
@article{carmi2012variance,
abstract = {Widespread sharing of long, identical-by-descent (IBD) genetic segments is a
hallmark of populations that have experienced a recent bottleneck. The
detection of these IBD segments is now feasible, enabling a wide range of
applications from phasing and imputation to demographic inference. Here, we
study the distribution of IBD sharing in the Wright-Fisher model. Using
coalescent theory, we calculate the mean and variance of the total sharing
between arbitrary pairs of individuals. We then study the cohort-averaged
sharing: the average total sharing between one individual to the rest of the
cohort. We find that for large cohorts, the cohort-averaged sharing is
distributed approximately normally. Surprisingly, the variance of this
distribution remains large even for large cohorts, implying the existence of
"hyper-sharing" individuals. The presence of such individuals bears important
consequences to the design of sequencing studies, since, if they are selected
for whole-genome sequencing, a larger fraction of the cohort can be
subsequently imputed. We calculate the expected gain in power of imputation by
IBD, and subsequently, in power to detect an association, when individuals are
either randomly selected or are specifically the hyper-sharing individuals.
Finally, we study the distribution of pairwise sharing and cohort-averaged
sharing in the Ashkenazi Jewish population.},
added-at = {2012-07-16T19:38:58.000+0200},
author = {Carmi, Shai and Palamara, Pier Francesco and Vacic, Vladimir and Lencz, Todd and Darvasi, Ariel and Pe'er, Itsik},
biburl = {https://www.bibsonomy.org/bibtex/2996ca176228199ece07755478c3e5d38/peter.ralph},
doi = {10.1534/genetics.112.147215},
interhash = {02d05acbb099f4cea8b2f35cdf9627b0},
intrahash = {996ca176228199ece07755478c3e5d38},
journal = {Genetics},
keywords = {IBD Wright-Fisher_model coalescent_theory},
month = dec,
pmid = {23267057},
timestamp = {2015-01-20T22:35:53.000+0100},
title = {The variance of identity-by-descent sharing in the {Wright}-{Fisher} model},
url = {http://arxiv.org/abs/1206.4745},
year = 2012
}