doc/html/PolySNP_8cc_source.html

 /*

 Copyright (C) 2003-2009 Kevin Thornton, krthornt[]@[]uci.edu

 Remove the brackets to email me.

 This file is part of libsequence.

 libsequence is free software: you can redistribute it and/or modify
 it under the terms of the GNU General Public License as published by
 the Free Software Foundation, either version 3 of the License, or
 (at your option) any later version.

 libsequence is distributed in the hope that it will be useful,
 but WITHOUT ANY WARRANTY; without even the implied warranty of
 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 GNU General Public License for more details.

 You should have received a copy of the GNU General Public License
 along with libsequence.  If not, see <http://www.gnu.org/licenses/>.

 */

 #include <cmath>
 #include <cfloat>
 #include <cassert>
 #include <utility>
 #include <cstdlib>
 #include <cctype>
 #include <set>
 #include <limits>
 #include <algorithm>
 #include <functional>
 #include <Sequence/PolyTable.hpp>
 #include <Sequence/Comparisons.hpp>
 #include <Sequence/Recombination.hpp>
 #include <Sequence/PolySNP.hpp>
 #include <Sequence/stateCounter.hpp>
 #include <Sequence/SeqConstants.hpp>
 #include <Sequence/PolySNPimpl.hpp>

 using std::string;
 using namespace Sequence::Recombination;

 namespace Sequence
 {
     /*!
       Binary predicate over two sequences.

       Returns true only when Sequence::Different(l, r) reports the two
       sequences as different AND \a l precedes \a r in a case-insensitive
       lexicographic comparison.  Different() is consulted first to prevent
       missing sites from causing two sequences to be labelled as distinct.
     */
     struct uniqueSeq
     {
         // Member types that used to be inherited from std::binary_function
         // (deprecated in C++11, removed in C++17).  Declared explicitly so
         // that code relying on them keeps compiling.
         using first_argument_type = std::string;
         using second_argument_type = std::string;
         using result_type = bool;

         inline bool
         operator()(const std::string &l, const std::string &r) const
         {
             if (!Different(l, r))
                 {
                     return false;
                 }
             // Case-insensitive "less than" on single characters.  The cast
             // to unsigned char keeps std::toupper well defined for
             // characters with negative values.
             return std::lexicographical_compare(
                 l.begin(), l.end(), r.begin(), r.end(),
                 [](const char lhs, const char rhs) {
                     return std::toupper(static_cast<unsigned char>(lhs))
                            < std::toupper(static_cast<unsigned char>(rhs));
                 });
         }
     };
     /*!
       Sets up the implementation object and immediately tabulates the
       per-site state counts by calling preprocess().

       \param data the polymorphism table to analyze (dereferenced here, so
       it must not be null)
       \param haveOutgroup true if one sequence in \a data is an outgroup
       \param outgroup index of the outgroup sequence in \a data
       \param totMuts stored in _totMuts for later use by the statistics
     */
     _PolySNPImpl::_PolySNPImpl(const Sequence::PolyTable *data,
                                const bool &haveOutgroup,
                                const unsigned &outgroup, const bool &totMuts)
         : _data(data), _nsites(data->numsites()),
           _nsam(static_cast<unsigned>(data->size())), _outgroup(outgroup),
           _haveOutgroup(haveOutgroup), _totMuts(totMuts),
           _totsam(static_cast<unsigned>(data->size())), _DVK(0), _DVH(1.0),
           _counted_singletons(false), _know_pi(false), _CalculatedDandV(false),
           _pi(0.), _singletons(0), _walls_Bprime(0), _NumPoly(0), _walls_B(0.),
           _walls_Q(0.), _calculated_wall_stats(false),
           // one counter per site
           _counts(_nsites, Sequence::stateCounter('-')),
           // one (flag, counter) pair per site; the flag starts out true
           _derivedCounts(_nsites, std::make_pair(true, stateCounter('-'))),
           _preprocessed(false)
     {
         // One of the sequences in data is the outgroup, so it does not
         // count toward the ingroup sample size.
         if (haveOutgroup)
             {
                 _totsam -= 1;
             }
         preprocess();
     }

     void
     _PolySNPImpl::preprocess()
     {
         if (!_preprocessed)
             {
                 for (unsigned site = 0; site < _nsites; ++site)
                     {
                         for (unsigned seq = 0; seq < _nsam; ++seq)
                             {
                                 // process counts w/o respect to
                                 // ancestral or derived
                                 if (!_haveOutgroup
                                     || (_haveOutgroup && seq != _outgroup))
                                     {
                                         _counts[site]((*_data)[seq][site]);
                                     }
                                 // process derived states if outgroup is
                                 // present
                                 if (_haveOutgroup == true)
                                     {
                                         // if outgroup state is missing data
                                         // or a gap
                                         // set the bool for that site to false
                                         if (std::toupper(
                                                 (*_data)[_outgroup][site])
                                                 == 'N'
                                             || (*_data)[_outgroup][site]
                                                    == '-')
                                             {
                                                 _derivedCounts[site].first
                                                     = false;
                                             }
                                         else
                                             {
                                                 // tabulate the derived state
                                                 _derivedCounts[site].first
                                                     = true;
                                                 if (seq != _outgroup
                                                     && (*_data)[seq][site]
                                                            != (*_data)
                                                                   [_outgroup]
                                                                   [site])
                                                     {
                                                         _derivedCounts[site]
                                                             .second((
                                                                 *_data)[seq]
                                                                        [site]);
                                                     }
                                             }
                                     }
                                 else
                                     {
                                         // if no outgroup, set bool
                                         // for site to false
                                         _derivedCounts[site].first = false;
                                     }
                             }
                         if (_counts[site].nStates() > 1
                             && _counts[site].gap == 0)
                             ++_NumPoly;
                     }
                 _preprocessed = true;
             }
     }

     /*!
       Creates the private implementation object from the arguments; all
       four are forwarded unchanged to the _PolySNPImpl constructor.

       \param data the polymorphism table to analyze
       \param haveOutgroup true if \a data contains an outgroup sequence
       \param outgroup index of the outgroup sequence in \a data
       \param totMuts forwarded to the implementation object
     */
     PolySNP::PolySNP(const Sequence::PolyTable *data, bool haveOutgroup,
                      unsigned outgroup, bool totMuts)
         : rep(new _PolySNPImpl(data, haveOutgroup, outgroup, totMuts))
     {
     }

     // Nothing to release by hand: the members clean up after themselves.
     PolySNP::~PolySNP() = default;

     /*!
       Sums, over sites, one minus the sum of site homozygosity.

       Only sites with a zero gap count and more than one state contribute.
       At each such site the sample size is reduced by the site's \c n count
       (missing data), and the site is skipped if fewer than two samples
       remain.  The result is computed once, stored in the implementation
       object and returned from there on later calls.  The computation and
       the cached value are accessed while holding rep->instance_lock.

       \return the summed value
     */
     double
     PolySNP::ThetaPi(void) const
     {
         assert(rep->_preprocessed);
         std::lock_guard<std::mutex> lock(rep->instance_lock);
         if (!rep->_know_pi)
             {
                 double Pi = 0.0;
                 for (unsigned site = 0; site < rep->_nsites; ++site)
                     {
                         auto &counts = rep->_counts[site];
                         if (counts.gap != 0 || counts.nStates() <= 1)
                             {
                                 continue;
                             }
                         // adjust sample size for missing data
                         unsigned samplesize = rep->_totsam;
                         samplesize -= counts.n;
                         if (samplesize <= 1)
                             {
                                 continue;
                             }
                         const double denom
                             = (double(samplesize)
                                * (double(samplesize) - 1.0));
                         double SSH = 0.0; // sum of site homozygosity
                         // Adds one state's contribution, count*(count-1)
                         // over denom; states that were not seen add
                         // nothing.
                         auto addState = [&SSH, denom](const unsigned count) {
                             if (count > 0)
                                 {
                                     SSH += double(count) * double(count - 1)
                                            / denom;
                                 }
                         };
                         addState(counts.a);
                         addState(counts.g);
                         addState(counts.c);
                         addState(counts.t);
                         addState(counts.zero);
                         addState(counts.one);
                         Pi += (1.0 - SSH);
                     }
                 rep->_pi = Pi;
                 rep->_know_pi = true;
             }
         return rep->_pi;
     }

     /*!
       Sums a per-site term over all sites that have a zero gap count and
       at least two states.  The term is m / (1/1 + 1/2 + ... + 1/(k-1)),
       where k is the total sample size minus the site's \c n count
       (missing data), and m is the number of states minus one when
       _totMuts is true, or 1 when it is false.

       \return the summed value
     */
     double
     PolySNP::ThetaW(void) const
     {
         assert(rep->_preprocessed);
         double W = 0.0;
         for (unsigned site = 0; site < rep->_nsites; ++site)
             { // iterate over sites
                 auto &counts = rep->_counts[site];
                 if (counts.gap != 0)
                     {
                         continue;
                     }
                 const unsigned nstates = counts.nStates();
                 if (nstates < 2)
                     {
                         continue; // site is not variable
                     }
                 const unsigned nsam_site = rep->_totsam - counts.n;
                 double denom = 0.0;
                 for (unsigned j = 1; j < nsam_site; ++j)
                     {
                         denom += 1.0 / double(j);
                     }
                 // numerator: either every inferred mutation at the site,
                 // or just one per variable site
                 const double numer
                     = rep->_totMuts ? double(nstates - 1) : 1.0;
                 W += numer / denom;
             }
         return W;
     }

     /*!
       Sums a per-site term built from the derived-state counts.

       Returns 0 when no polymorphic sites were found during preprocessing,
       and a quiet NaN when there is no outgroup.

       A site contributes only if its derived-state counter has a zero gap
       count, the outgroup state was usable (the site's flag is true) and
       the ancestral state is seen at least once in the ingroup.  Then:
       - with exactly one derived state of count d, the term is
         2*d*d / (k*(k-1)), where k is the sample size minus the site's
         \c n count;
       - with exactly two derived states, each one is handled in turn with
         the other's count removed from the sample size (a "missing data"
         scheme);
       - sites with any other number of derived states add nothing.

       \return the summed value
     */
     double
     PolySNP::ThetaH(void) const
     {
         assert(rep->_preprocessed);
         if (rep->_NumPoly == 0)
             return 0.;
         if (!rep->_haveOutgroup)
             return std::numeric_limits<double>::quiet_NaN();
         double H = 0.0;

         for (unsigned site = 0; site < rep->_nsites; ++site)
             { // iterate over sites
                 auto &siteInfo = rep->_derivedCounts[site];
                 auto &derived = siteInfo.second;
                 if (derived.gap != 0)
                     {
                         continue;
                     }
                 unsigned samplesize = rep->_totsam; // sample size per site
                 unsigned sumDerCounts = 0;
                 sumDerCounts += derived.a;
                 sumDerCounts += derived.g;
                 sumDerCounts += derived.c;
                 sumDerCounts += derived.t;
                 sumDerCounts += derived.zero;
                 sumDerCounts += derived.one;
                 const unsigned ancestralCounts
                     = samplesize - sumDerCounts - derived.n;

                 // If the ancestral state is not missing data, and the
                 // derived counts plus the missing data in the ingroup do
                 // not add up to the sample size, then the ancestral state
                 // is present at least once in the ingroup.
                 const bool anc_is_present
                     = (siteInfo.first && ancestralCounts > 0);
                 if (!anc_is_present) // ancestral state must be present
                     {
                         continue;
                     }

                 // number of derived states seen at this site
                 const unsigned numDer = derived.nStates();
                 if (numDer == 1)
                     { // simple if there is only one derived state inferred
                         samplesize -= derived.n;
                         const double denom
                             = (double(samplesize)
                                * (double(samplesize) - 1.0));
                         // Adds 2*count^2/denom for a state that was seen;
                         // the square is a plain multiplication rather than
                         // a call to pow().
                         auto addState = [&H, denom](const unsigned count) {
                             if (count > 0)
                                 {
                                     const double d = double(count);
                                     H += (2.0 * (d * d)) / denom;
                                 }
                         };
                         addState(derived.a);
                         addState(derived.g);
                         addState(derived.c);
                         addState(derived.t);
                         addState(derived.zero);
                         addState(derived.one);
                     }
                 else if (numDer == 2)
                     { // use a "missing data" scheme if there is >1 derived
                         // state.  An outgroup is required for this; its
                         // presence was already checked on entry.
                         // NOTE(review): unlike the branch above, the
                         // sample size here is not reduced by the site's n
                         // count -- confirm this is intended.
                         unsigned config[2] = { 0u, 0u };
                         unsigned k = 0;
                         // Records the counts of the derived states that
                         // were seen, never writing past the two slots.
                         auto record = [&config, &k](const unsigned count) {
                             if (count > 0 && k < 2)
                                 {
                                     config[k++] = count;
                                 }
                         };
                         record(derived.a);
                         record(derived.g);
                         record(derived.c);
                         record(derived.t);
                         record(derived.zero);
                         record(derived.one);
                         for (unsigned j = 0; j < 2; ++j)
                             {
                                 // treat the other derived state as
                                 // missing data
                                 const double sample_size_adjust
                                     = double(config[1 - j]);
                                 const double d = double(config[j]);
                                 H += (2.0 * (d * d))
                                      / ((double(samplesize)
                                          - sample_size_adjust)
                                         * (double(samplesize)
                                            - sample_size_adjust - 1.0));
                             }
                     }
             }
         return H;
     }

     double
     PolySNP::ThetaL(void) const
     {
         if (!rep->_haveOutgroup)
             {
                 return std::numeric_limits<double>::quiet_NaN();
             }
         assert(rep->_preprocessed);
         double thetal = 0.0;
         if (rep->_NumPoly == 0)
             return thetal;
         bool anc_is_present = 0; // is ancestral state present in the ingroup?

         for (unsigned i = 0; i < rep->_nsites; ++i)
             { // iterate over sites
                 if (rep->_derivedCounts[i].first == true
                     && rep->_derivedCounts[i].second.gap == 0)
                     {
                         unsigned samplesize
                             = rep->_totsam; // sample size per site
                         unsigned sumDerCounts = 0;
                         sumDerCounts += rep->_derivedCounts[i].second.a;
                         sumDerCounts += rep->_derivedCounts[i].second.g;
                         sumDerCounts += rep->_derivedCounts[i].second.c;
                         sumDerCounts += rep->_derivedCounts[i].second.t;
                         sumDerCounts += rep->_derivedCounts[i].second.zero;
                         sumDerCounts += rep->_derivedCounts[i].second.one;
                         unsigned ancestralCounts
                             = samplesize - sumDerCounts
                               - rep->_derivedCounts[i].second.n;

                         // if the ancestral state is not missing data, and
                         // the sum of the derived counts + and missing data in
                         // the ingroup
                         // does not equal the sample size, then the ancestral
                         // state is present
                         // at least once in the ingroup, and anc_is_present =
                         // true
                         anc_is_present = (rep->_derivedCounts[i].first == true
                                           && ancestralCounts > 0)
                                              ? true
                                              : false;
                         if (anc_is_present) // ancestral state must be present
                             {
                                 // number of derived states seen at this site
                                 unsigned numDer
                                     = rep->_derivedCounts[i].second.nStates();
                                 if (numDer == 1)
                                     { // simple if there is only one derived
                                         // state inferred
                                         samplesize
                                             -= rep->_derivedCounts[i].second.n;
                                         double denom
                                             = (double(samplesize) - 1.0);
                                         thetal
                                             += (rep->_derivedCounts[i].second.a
                                                 > 0)
                                                    ? double(
                                                          rep->_derivedCounts[i]
                                                              .second.a)
                                                          / denom
                                                    : 0.;
                                         thetal
                                             += (rep->_derivedCounts[i].second.g
                                                 > 0)
                                                    ? double(
                                                          rep->_derivedCounts[i]
                                                              .second.g)
                                                          / denom
                                                    : 0.;
                                         thetal
                                             += (rep->_derivedCounts[i].second.c
                                                 > 0)
                                                    ? double(
                                                          rep->_derivedCounts[i]
                                                              .second.c)
                                                          / denom
                                                    : 0.;
                                         thetal
                                             += (rep->_derivedCounts[i].second.t
                                                 > 0)
                                                    ? double(
                                                          rep->_derivedCounts[i]
                                                              .second.t)
                                                          / denom
                                                    : 0.;
                                         thetal
                                             += (rep->_derivedCounts[i]
                                                     .second.zero
                                                 > 0)
                                                    ? double(
                                                          rep->_derivedCounts[i]
                                                              .second.zero)
                                                          / denom
                                                    : 0.;
                                         thetal
                                             += (rep->_derivedCounts[i]
                                                     .second.one
                                                 > 0)
                                                    ? double(
                                                          rep->_derivedCounts[i]
                                                              .second.one)
                                                          / denom
                                                    : 0.;
                                     }
                                 else if (numDer == 2
                                          && rep->_haveOutgroup) // MUST have
                                     // outgroup--else
                                     // can't proceed
                                     { // use a "missing data" scheme if there
                                         // is >1 derived state
                                         // iterate over derived states
                                         unsigned config[2];
                                         unsigned k = 0;
                                         if (rep->_derivedCounts[i].second.a
                                             > 0)
                                             {
                                                 config[k++]
                                                     = rep->_derivedCounts[i]
                                                           .second.a;
                                             }
                                         if (rep->_derivedCounts[i].second.g
                                             > 0)
                                             {
                                                 config[k++]
                                                     = rep->_derivedCounts[i]
                                                           .second.g;
                                             }
                                         if (rep->_derivedCounts[i].second.c
                                             > 0)
                                             {
                                                 config[k++]
                                                     = rep->_derivedCounts[i]
                                                           .second.c;
                                             }
                                         if (rep->_derivedCounts[i].second.t
                                             > 0)
                                             {
                                                 config[k++]
                                                     = rep->_derivedCounts[i]
                                                           .second.t;
                                             }
                                         if (rep->_derivedCounts[i].second.zero
                                             > 0)
                                             {
                                                 config[k++]
                                                     = rep->_derivedCounts[i]
                                                           .second.zero;
                                             }
                                         if (rep->_derivedCounts[i].second.one
                                             > 0)
                                             {
                                                 config[k++]
                                                     = rep->_derivedCounts[i]
                                                           .second.one;
                                             }
                                         for (int i = 0; i < 2; ++i)
                                             {
                                                 double sample_size_adjust
                                                     = (i == 0)
                                                           ? double(config[1])
                                                           : double(config[0]);
                                                 thetal
                                                     += (double(config[i]))
                                                        / (double(samplesize)
                                                           - sample_size_adjust
                                                           - 1.0);
                                             }
                                     }
                             }
                     }
             }
         return thetal;
     }

     // Returns the number of sites whose state counter reports more than one
     // state (nStates() > 1) and whose gap count is zero.
     unsigned
     PolySNP::NumPoly(void) const
     {
         assert(rep->_preprocessed);
         unsigned segregating = 0;
         for (unsigned site = 0; site < rep->_nsites; ++site)
             {
                 const auto &tally = rep->_counts[site];
                 if (tally.nStates() > 1 && tally.gap == 0)
                     {
                         ++segregating;
                     }
             }
         return segregating;
     }

     // Returns the total over all gap-free sites of (number of states - 1).
     // Sites containing a gap, or with fewer than two states, contribute
     // nothing.
     unsigned
     PolySNP::NumMutations(void) const
     {
         assert(rep->_preprocessed);
         unsigned total = 0;

         for (unsigned site = 0; site < rep->_nsites; ++site)
             {
                 const auto &tally = rep->_counts[site];
                 if (tally.gap != 0)
                     {
                         // gapped sites are treated as having zero states
                         continue;
                     }
                 const unsigned states = tally.nStates();
                 if (states > 1)
                     {
                         total += states - 1;
                     }
             }
         return total;
     }

     // Returns the number of singletons summed over gap-free sites with more
     // than one state.  At each such site every state (a, g, c, t, zero,
     // one) whose count is exactly 1 adds one singleton.
     unsigned
     PolySNP::NumSingletons(void) const
     {
         assert(rep->_preprocessed);
         unsigned total = 0;
         for (unsigned site = 0; site < rep->_nsites; ++site)
             {
                 const auto &tally = rep->_counts[site];
                 const unsigned states = tally.nStates();
                 if (tally.gap != 0 || states <= 1)
                     {
                         continue;
                     }
                 // sample size at this site after removing tally.n
                 // (presumably the missing-data count -- TODO confirm)
                 const unsigned informative = rep->_totsam - tally.n;
                 if (informative == 2 && states == 2)
                     {
                         // two sequences, two states: both counts are 1,
                         // but that is a single singleton, not two
                         total += 1;
                         continue;
                     }
                 unsigned here = 0;
                 if (tally.a == 1)
                     ++here;
                 if (tally.g == 1)
                     ++here;
                 if (tally.c == 1)
                     ++here;
                 if (tally.t == 1)
                     ++here;
                 if (tally.zero == 1)
                     ++here;
                 if (tally.one == 1)
                     ++here;
                 total += here;
             }
         return total;
     }

     // Returns the number of derived states that occur exactly once, summed
     // over sites.  Returns SEQMAXUNSIGNED when no outgroup is available.
     // A site is used only when its _derivedCounts entry is flagged (first
     // == true), its derived counter has no gaps, and more than one
     // sequence remains after subtracting the counter's n field.
     unsigned
     PolySNP::NumExternalMutations(void) const
     {
         if (!rep->_haveOutgroup)
             return SEQMAXUNSIGNED;
         assert(rep->_preprocessed);
         unsigned total = 0;
         for (unsigned site = 0; site < rep->_nsites; ++site)
             {
                 const auto &entry = rep->_derivedCounts[site];
                 if (!(entry.first == true && entry.second.gap == 0))
                     {
                         continue;
                     }
                 const auto &derived = entry.second;
                 unsigned informative = rep->_totsam;
                 informative -= derived.n;
                 if (!(informative > 1))
                     {
                         continue;
                     }
                 unsigned here = 0;
                 if (derived.a == 1)
                     ++here;
                 if (derived.g == 1)
                     ++here;
                 if (derived.c == 1)
                     ++here;
                 if (derived.t == 1)
                     ++here;
                 if (derived.zero == 1)
                     ++here;
                 if (derived.one == 1)
                     ++here;
                 total += here;
             }
         return total;
     }

     // Returns (ThetaPi() - ThetaW()) / Dnominator().
     // Returns NaN when there are no polymorphic sites, and 0 when both
     // estimators are within DBL_EPSILON of zero.
     double
     PolySNP::TajimasD(void) const
     {
         assert(rep->_preprocessed);
         if (rep->_NumPoly == 0)
             {
                 return std::numeric_limits<double>::quiet_NaN();
             }
         const double pi = ThetaPi();
         const double watterson = ThetaW();
         const bool both_zero = fabs(pi - 0.) <= DBL_EPSILON
                                && fabs(watterson - 0.) <= DBL_EPSILON;
         if (both_zero)
             {
                 return 0.0;
             }
         return (pi - watterson) / Dnominator();
     }

     double
     PolySNP::Hprime(const bool &likeThorntonAndolfatto) const
     {
         assert(rep->_preprocessed);
         if (rep->_NumPoly == 0)
             return std::numeric_limits<double>::quiet_NaN();
         assert(rep->_haveOutgroup == true);
         double a = a_sub_n();
         double b = b_sub_n();
         double pi = ThetaPi();
         double theta = ThetaW();

         double thetal = ThetaL();
         double b_n_plus1 = b_sub_n_plus1();
         double S = (rep->_totMuts) ? NumMutations() : NumPoly();
         double thetasq = (likeThorntonAndolfatto == false)
                              ? S * (S - 1) / (a * a + b)
                              : theta * theta;

         double vThetal = (rep->_totsam * theta) / (2.0 * (rep->_totsam - 1.0))
                          + (2.0 * pow(rep->_totsam / (rep->_totsam - 1.0), 2.0)
                                 * (b_n_plus1 - 1.0)
                             - 1.0)
                                * thetasq;

         double vPi
             = (3.0 * rep->_totsam * (rep->_totsam + 1.0) * theta
                + 2.0 * (rep->_totsam * rep->_totsam + rep->_totsam + 3.0)
                      * thetasq)
               / (9 * rep->_totsam * (rep->_totsam - 1.0));

         double cov
             = ((rep->_totsam + 1.0) / (3.0 * (rep->_totsam - 1.0))) * theta
               + ((7.0 * rep->_totsam * rep->_totsam + 3.0 * rep->_totsam - 2.0
                   - 4.0 * rep->_totsam * (rep->_totsam + 1.0) * b_n_plus1)
                  / (2.0 * pow((rep->_totsam - 1.0), 2.0)))
                     * thetasq;

         double Hpr = pi - thetal;
         Hpr /= pow((vThetal + vPi - 2.0 * cov), 0.5);
         return (Hpr);
     }

     // Returns sqrt(e1 * S + e2 * S * (S - 1)), the value TajimasD() divides
     // by.  S is NumMutations() when rep->_totMuts is set, NumPoly()
     // otherwise.  Returns NaN when there are no polymorphic sites.
     double
     PolySNP::Dnominator(void) const
     {
         assert(rep->_preprocessed);
         if (rep->_NumPoly == 0)
             {
                 return std::numeric_limits<double>::quiet_NaN();
             }
         const double S
             = rep->_totMuts ? double(NumMutations()) : double(NumPoly());

         const auto n = rep->_totsam;
         const double a1 = a_sub_n();
         const double a2 = b_sub_n();
         const double a1sq = pow(a1, 2.0);

         const double b1 = (n + 1.0) / (3.0 * (n - 1.0));
         const double b2
             = (2.0 * (pow(n, 2.0) + n + 3.0)) / (9.0 * n * (n - 1.0));
         const double c1 = b1 - 1.0 / a1;
         const double c2 = b2 - (n + 2.0) / (a1 * n) + a2 / a1sq;
         const double e1 = c1 / a1;
         const double e2 = c2 / (a1sq + a2);

         return pow((e1 * S + e2 * S * (S - 1.0)), 0.5);
     }

     void
     PolySNP::DepaulisVeuilleStatistics(void) const
     {
         assert(rep->_preprocessed);
         std::lock_guard<std::mutex> lock(rep->instance_lock);
         if (!(rep->_CalculatedDandV))
             {
                 if (rep->_NumPoly == 0)
                     {
                         rep->_DVK = 1;
                         rep->_DVH = 0.;
                         return;
                     }
                 if (rep->_data->size() > 0)
                     {
                         // step 1 : determine which sequences are unique in the
                         // data,
                         // exluding missing data
                         std::set<string, uniqueSeq> unique_haplotypes;
                         if (rep->_haveOutgroup)
                             {
                                 unique_haplotypes.insert(rep->_data->begin(),
                                                          rep->_data->begin()
                                                              + rep->_outgroup);
                                 unique_haplotypes.insert(
                                     rep->_data->begin() + rep->_outgroup + 1,
                                     rep->_data->end());
                             }
                         else
                             {
                                 unique_haplotypes.insert(rep->_data->begin(),
                                                          rep->_data->end());
                             }
                         std::vector<std::string> vuhaps(
                             unique_haplotypes.size());
                         rep->_DVK = unsigned(unique_haplotypes.size());
                         std::move(unique_haplotypes.begin(),
                                   unique_haplotypes.end(), vuhaps.begin());
                         double homozygosity = 0.0;
                         for (auto &uh : vuhaps)
                             {
                                 double c = 0.0;
                                 if (rep->_haveOutgroup)
                                     {
                                         c = static_cast<double>(std::count_if(
                                             rep->_data->begin(),
                                             rep->_data->begin()
                                                 + rep->_outgroup,
                                             [&uh](const std::string &__s) {
                                                 return !Different(__s, uh,
                                                                   false, true);
                                             }));
                                         c += static_cast<double>(std::count_if(
                                             rep->_data->begin()
                                                 + rep->_outgroup + 1,
                                             rep->_data->end(),
                                             [&uh](const std::string &__s) {
                                                 return !Different(__s, uh,
                                                                   false, true);
                                             }));
                                     }
                                 else
                                     {
                                         c = static_cast<double>(std::count_if(
                                             rep->_data->begin(),
                                             rep->_data->end(),
                                             [&uh](const std::string &__s) {
                                                 return !Different(__s, uh,
                                                                   false, true);
                                             }));
                                     }
                                 c /= static_cast<double>(rep->_totsam);
                                 homozygosity += pow(c, 2.);
                             }
                         rep->_DVH -= homozygosity;
                         rep->_DVH *= rep->_totsam / (rep->_totsam - 1.0);
                         rep->_CalculatedDandV = 1;
                     }
             }
     }

     // Returns rep->_walls_B after making sure WallStats() has run.
     double
     PolySNP::WallsB(void) const
     {
         assert(rep->_preprocessed);
         WallStats();
         const double B = rep->_walls_B;
         return B;
     }

     // Computes and caches the three Wall statistics: rep->_walls_B,
     // rep->_walls_Bprime and rep->_walls_Q.  The computation is skipped when
     // rep->_calculated_wall_stats is already set; the flag is set on exit.
     //
     // When fewer than two gap-free two-state sites exist, B and Q are set to
     // NaN and B' to 0.
     //
     // NOTE(review): unlike DepaulisVeuilleStatistics(), no lock is taken
     // here before the cached members are written.
     void
     PolySNP::WallStats(void) const
     {
         assert(rep->_preprocessed);
         if (!rep->_calculated_wall_stats)
             {
                 unsigned S = 0;
                 // explicitly count the number of bi-allelic, gap-free sites,
                 // since that is the proper denominator
                 for (std::vector<stateCounter>::const_iterator itr
                      = rep->_counts.begin();
                      itr < rep->_counts.end(); ++itr)
                     {
                         if (itr->nStates() == 2 && itr->gap == 0)
                             ++S;
                     }
                 if (S > 1)
                     {
                         // std::ptrdiff_t nhap_curr, nhap_left;
                         // number of distinct two-site haplotypes for the
                         // current pair and for the previously scored pair
                         std::set<std::basic_string<char>,
                                  Sequence::uniqueSeq>::size_type nhap_curr,
                             nhap_left;

                         // sentinel: no pair has been scored yet
                         nhap_left = SEQMAXUNSIGNED;

                         unsigned A = 0; // number of partitions with D' = 1
                                         // (see Wall 1999)
                         // iterate over sites (actually, adjacent pairs of
                         // two-state sites)
                         // NOTE(review): the pair test below checks only
                         // nStates() == 2, whereas S above also requires
                         // gap == 0 -- confirm this is intended.
                         for (unsigned site1 = 0; site1 < rep->_nsites - 1;
                              ++site1)
                             {
                                 for (unsigned site2 = site1 + 1;
                                      site2 < rep->_nsites; ++site2)
                                     {
                                         if (rep->_counts[site1].nStates() == 2
                                             && rep->_counts[site2].nStates()
                                                    == 2)
                                             {
                                                 // build the two-character
                                                 // haplotype of every ingroup
                                                 // sequence and count the
                                                 // distinct ones
                                                 std::string config;
                                                 config.resize(2);
                                                 std::set<string, uniqueSeq>
                                                     unique_haplotypes;
                                                 nhap_curr = 0;
                                                 for (unsigned i = 0;
                                                      i < rep->_nsam; ++i)
                                                     {
                                                         // skip the outgroup
                                                         // sequence, if any
                                                         if ((!rep->_haveOutgroup)
                                                             || (rep->_haveOutgroup
                                                                 && i != rep->_outgroup))
                                                             {
                                                                 config[0]
                                                                     = (*rep->_data)
                                                                         [i]
                                                                         [site1];
                                                                 config[1]
                                                                     = (*rep->_data)
                                                                         [i]
                                                                         [site2];
                                                                 unique_haplotypes
                                                                     .insert(
                                                                         config);
                                                             }
                                                     }
                                                 nhap_curr
                                                     = unique_haplotypes.size();
                                                 // a pair with exactly two
                                                 // haplotypes adds to B'; A
                                                 // grows only when the
                                                 // previous pair did not also
                                                 // have exactly two
                                                 // NOTE(review): B' is
                                                 // incremented from its
                                                 // existing value; presumably
                                                 // it starts at 0 -- confirm.
                                                 if (site1 == 0)
                                                     {
                                                         if (nhap_curr == 2)
                                                             {
                                                                 ++rep->_walls_Bprime;
                                                                 ++A;
                                                             }
                                                     }
                                                 else
                                                     {
                                                         if (nhap_curr == 2)
                                                             ++rep->_walls_Bprime;
                                                         if (nhap_curr == 2
                                                             && nhap_left != 2)
                                                             ++A;
                                                     }
                                                 nhap_left = nhap_curr;
                                                 // the right-hand site of this
                                                 // pair becomes the left-hand
                                                 // site of the next pair while
                                                 // the inner loop keeps
                                                 // advancing site2
                                                 site1 = site2;
                                             }
                                     }
                             }
                         rep->_walls_B
                             = double(rep->_walls_Bprime) / (double(S - 1));
                         rep->_walls_Q
                             = (double(rep->_walls_Bprime) + double(A))
                               / (double(S));
                     }
                 else
                     {
                         // too few usable sites: the ratios are undefined
                         rep->_walls_B
                             = std::numeric_limits<double>::quiet_NaN();
                         rep->_walls_Bprime = 0;
                         rep->_walls_Q
                             = std::numeric_limits<double>::quiet_NaN();
                     }
             }
         rep->_calculated_wall_stats = true;
     }

     // Returns rep->_walls_Bprime after making sure WallStats() has run.
     unsigned
     PolySNP::WallsBprime(void) const
     {
         assert(rep->_preprocessed);
         WallStats();
         const unsigned Bprime = rep->_walls_Bprime;
         return Bprime;
     }

     // Returns rep->_walls_Q after making sure WallStats() has run.
     double
     PolySNP::WallsQ(void) const
     {
         assert(rep->_preprocessed);
         WallStats();
         const double Q = rep->_walls_Q;
         return Q;
     }

     // Returns
     //   [3n(n+1) Pi + 2(n^2+n+3) Pi^2] / (11n^2 - 7n + 6)
     // with Pi = ThetaPi() and n = rep->_totsam.  Returns NaN when the data
     // are empty or there are no polymorphic sites.
     double
     PolySNP::VarPi(void) const
     {
         if (rep->_data->empty() || !NumPoly())
             {
                 return std::numeric_limits<double>::quiet_NaN();
             }
         const double Pi = ThetaPi();
         const auto n = rep->_totsam;
         const double numerator
             = 3.0 * n * (n + 1.0) * Pi
               + 2.0 * (pow(n, 2.0) + n + 3.0) * pow(Pi, 2.0);
         const double denominator = 11.0 * pow(n, 2.0) - 7.0 * n + 6.0;
         return numerator / denominator;
     }

     // Returns
     //   [(3n^2 - 3n + 2) Pi + 2n(n-1) Pi^2] / (11n^2 - 7n + 6)
     // with Pi = ThetaPi() and n = rep->_totsam.  Returns NaN when the data
     // are empty or there are no polymorphic sites.
     double
     PolySNP::StochasticVarPi(void) const
     {
         if (rep->_data->empty() || !NumPoly())
             {
                 return std::numeric_limits<double>::quiet_NaN();
             }
         const double Pi = ThetaPi();
         const auto n = rep->_totsam;
         const double numerator = (3.0 * pow(n, 2.0) - 3.0 * n + 2.0) * Pi
                                  + 2.0 * n * (n - 1.0) * pow(Pi, 2.0);
         const double denominator = 11.0 * pow(n, 2.0) - 7.0 * n + 6.0;
         return numerator / denominator;
     }

     // Returns
     //   [2(3n - 1) Pi + 2(2n + 3) Pi^2] / (11n^2 - 7n + 6)
     // with Pi = ThetaPi() and n = rep->_totsam.  Returns NaN when the data
     // are empty or there are no polymorphic sites.
     double
     PolySNP::SamplingVarPi(void) const
     {
         if (rep->_data->empty() || !NumPoly())
             {
                 return std::numeric_limits<double>::quiet_NaN();
             }
         const double Pi = ThetaPi();
         const auto n = rep->_totsam;
         const double numerator = 2.0 * (3.0 * n - 1.0) * Pi
                                  + 2.0 * (2.0 * n + 3.0) * pow(Pi, 2.0);
         const double denominator = 11.0 * pow(n, 2.0) - 7.0 * n + 6.0;
         return numerator / denominator;
     }

     // Returns
     //   (a1^2 S + a2 S^2) / (a1^2 (a1^2 + a2))
     // where a1 = a_sub_n(), a2 = b_sub_n() and S is NumMutations() or
     // NumPoly() depending on rep->_totMuts.  Returns NaN when the data are
     // empty or there are no polymorphic sites.
     double
     PolySNP::VarThetaW(void) const
     {
         if (rep->_data->empty() || !NumPoly())
             {
                 return std::numeric_limits<double>::quiet_NaN();
             }
         const double a1 = a_sub_n();
         const double a2 = b_sub_n();
         double S;
         if (rep->_totMuts)
             S = NumMutations();
         else
             S = NumPoly();
         const double a1sq = pow(a1, 2.0);
         const double numerator = a1sq * S + a2 * pow(S, 2.0);
         return numerator / (a1sq * (a1sq + a2));
     }

     // correct
     double
     PolySNP::FuLiD(void) const
     {
         assert(rep->_preprocessed);
         //    assert(rep->_haveOutgroup == true);
         if (rep->_NumPoly == 0 || !rep->_haveOutgroup)
             return std::numeric_limits<double>::quiet_NaN();
         double ExternalMutations = double(NumExternalMutations());
         double NumMut = double(NumMutations());
         double a = a_sub_n();
         double b = b_sub_n();
         double c = c_sub_n();
         double vD = 1.0
                     + (pow(a, 2.0) / (b + pow(a, 2.0))
                        * (c - (rep->_totsam + 1.0) / (rep->_totsam - 1.0)));
         double uD = a - 1.0 - vD;
         double D = NumMut - a * double(ExternalMutations);
         D /= pow((uD * NumMut + vD * pow(NumMut, 2.0)), 0.5);
         return (D);
     }

     // correct
     double
     PolySNP::FuLiF(void) const
     {
         assert(rep->_preprocessed);
         if (rep->_NumPoly == 0 || !rep->_haveOutgroup)
             return std::numeric_limits<double>::quiet_NaN();
         double Pi = ThetaPi();
         double NumMut = double(NumMutations());
         double ExternalMutations = double(NumExternalMutations());
         double a = a_sub_n();
         double a_n_plus1 = a_sub_n_plus1();
         double b = b_sub_n();
         double c = c_sub_n();
         double vF
             = c
               + 2.0 * (pow(rep->_totsam, 2.0) + rep->_totsam + 3.0)
                     / (9.0 * rep->_totsam * (double(rep->_totsam - 1.0)));
         vF -= (2.0 / (rep->_totsam - 1.0));
         vF /= (pow(a, 2.0) + b);

         double uF
             = 1.0
               + (rep->_totsam + 1.0) / (3.0 * (double(rep->_totsam - 1.0)));
         uF -= 4.0 * ((rep->_totsam + 1.0) / (pow(rep->_totsam - 1.0, 2.0)))
               * (a_n_plus1 - 2.0 * rep->_totsam / (rep->_totsam + 1.0));
         uF /= a;
         uF -= vF;

         double F = Pi - ExternalMutations;
         F /= pow(uF * NumMut + vF * pow(NumMut, 2.0), 0.5);
         return (F);
     }

     // correct
     double
     PolySNP::FuLiDStar(void) const
     {
         assert(rep->_preprocessed);
         if (rep->_NumPoly == 0)
             return std::numeric_limits<double>::quiet_NaN();
         double Singletons = double(NumSingletons());
         double NumMut = double(NumMutations());

         double a = a_sub_n();
         double b = b_sub_n();
         double d = d_sub_n();

         double vD = pow(rep->_totsam / (rep->_totsam - 1.0), 2.0) * b;
         vD += pow(a, 2.0) * d;
         vD -= 2.0 * (rep->_totsam * a * (a + 1.0))
               / (pow(double(rep->_totsam - 1.0), 2.0));
         vD /= (pow(a, 2.0) + b);

         double uD = (rep->_totsam / (rep->_totsam - 1.0))
                         * (a - (rep->_totsam / (rep->_totsam - 1.0)))
                     - vD;

         double DStar = (rep->_totsam / (rep->_totsam - 1.0)) * NumMut
                        - a * double(Singletons);
         DStar /= pow(uD * NumMut + vD * pow(NumMut, 2.0), 0.5);
         return (DStar);
     }

     // correct
     double
     PolySNP::FuLiFStar(void) const
     {
         assert(rep->_preprocessed);
         if (rep->_NumPoly == 0)
             return std::numeric_limits<double>::quiet_NaN();
         double Singletons = double(NumSingletons());
         double Pi = ThetaPi();
         double NumMut = double(NumMutations());

         double a = a_sub_n();
         double a_n_plus1 = a_sub_n_plus1();
         double b = b_sub_n();
         // vF is taken from the correction published by
         // Simonsen et al.  (1995) Genetics 141: 413, eqn A5
         double vF = 2.0 * pow(rep->_totsam, 3.0)
                     + 110.0 * pow(rep->_totsam, 2.0) - 255.0 * rep->_totsam
                     + 153.0;
         vF /= (9.0 * pow(rep->_totsam, 2.0) * (rep->_totsam - 1.0));
         vF += (((2.0 * (rep->_totsam - 1.0) * a) / pow(rep->_totsam, 2.0))
                - (8.0 * b / rep->_totsam));
         vF /= (pow(a, 2.0) + b);

         double uF = (4.0 * pow(rep->_totsam, 2.0) + 19.0 * rep->_totsam + 3.0
                      - 12.0 * (rep->_totsam + 1.0) * a_n_plus1);
         uF /= (3.0 * rep->_totsam * (rep->_totsam - 1.0));
         uF /= a;
         uF -= vF;
         double FStar
             = Pi
               - (((rep->_totsam - 1.0) / rep->_totsam)) * double(Singletons);
         FStar /= pow((uF * NumMut + vF * pow(NumMut, 2.0)), 0.5);
         return (FStar);
     }

     // Returns the sum of 1/i for i = 1 .. n-1, where n = rep->_totsam.
     double
     PolySNP::a_sub_n(void) const
     {
         assert(rep->_preprocessed);
         const int upper = int(rep->_totsam);
         double harmonic = 0.0;
         for (int k = 1; k < upper; ++k)
             {
                 harmonic += 1. / double(k);
             }
         return harmonic;
     }

     // Returns the sum of 1/i for i = 1 .. n, where n = rep->_totsam.
     // Used by the Fu and Li tests.
     double
     PolySNP::a_sub_n_plus1(void) const
     {
         assert(rep->_preprocessed);
         const int upper = int(rep->_totsam) + 1;
         double harmonic = 0.0;
         for (int k = 1; k < upper; ++k)
             harmonic += 1. / double(k);
         return harmonic;
     }

     // Returns the sum of 1/i^2 for i = 1 .. n-1, where n = rep->_totsam.
     double
     PolySNP::b_sub_n(void) const
     {
         assert(rep->_preprocessed);
         const int upper = int(rep->_totsam);
         double sum_inv_sq = 0.0;
         for (int k = 1; k < upper; ++k)
             {
                 sum_inv_sq += 1. / (pow(double(k), 2.0));
             }
         return sum_inv_sq;
     }

     // Returns the sum of 1/i^2 for i = 1 .. n, where n = rep->_totsam.
     double
     PolySNP::b_sub_n_plus1(void) const
     {
         assert(rep->_preprocessed);
         const int upper = int(rep->_totsam) + 1;
         double sum_inv_sq = 0.0;
         for (int k = 1; k < upper; ++k)
             {
                 sum_inv_sq += 1. / (pow(double(k), 2.0));
             }
         return sum_inv_sq;
     }

     // c_n from Fu and Li 93:
     //   1                                     when n == 2
     //   2 (n a_n - 2 (n - 1)) / ((n-1)(n-2))  otherwise
     // with n = rep->_totsam and a_n = a_sub_n().
     double
     PolySNP::c_sub_n(void) const
     {
         assert(rep->_preprocessed);
         const double a = a_sub_n();
         const auto n = rep->_totsam;
         if (fabs(n - 2.) <= DBL_EPSILON)
             {
                 // the general formula would divide by (n - 2) == 0
                 return 1.0;
             }
         const double numerator = 2.0 * (n * a - 2.0 * (n - 1.0));
         return numerator / ((n - 1.0) * (n - 2.0));
     }

     double
     PolySNP::d_sub_n(void) const
     { // from Fu and Li 93
         assert(rep->_preprocessed);
         double a_n_plus1, c, d;
         a_n_plus1 = a_sub_n_plus1();
         c = c_sub_n();
         d = c + (rep->_totsam - 2.0) / (pow(rep->_totsam - 1.0, 2.0));
         d += (2.0 / (rep->_totsam - 1.0))
              * (1.5 - ((2.0 * a_n_plus1 - 3.0) / (rep->_totsam - 2.0))
                 - 1.0 / rep->_totsam);
         return d;
     }

     // Returns rep->_DVH, running DepaulisVeuilleStatistics() first when the
     // cached flag is not set.
     // NOTE(review): the flag is read here without holding
     // rep->instance_lock; only the callee takes the lock.
     double
     PolySNP::DandVH(void) const
     {
         const bool cached = rep->_CalculatedDandV;
         if (!cached)
             {
                 DepaulisVeuilleStatistics();
             }
         return rep->_DVH;
     }

     // Returns rep->_DVK, running DepaulisVeuilleStatistics() first when the
     // cached flag is not set.
     // NOTE(review): the flag is read here without holding
     // rep->instance_lock; only the callee takes the lock.
     unsigned
     PolySNP::DandVK(void) const
     {
         const bool cached = rep->_CalculatedDandV;
         if (!cached)
             {
                 DepaulisVeuilleStatistics();
             }
         return rep->_DVK;
     }

     // Forwards to Recombination::HudsonsC() with the stored data and
     // outgroup settings.  Returns NaN when there are no polymorphic sites.
     double
     PolySNP::HudsonsC(void) const
     {
         assert(rep->_preprocessed);
         if (rep->_NumPoly != 0)
             {
                 return (Recombination::HudsonsC(
                     rep->_data, rep->_haveOutgroup, rep->_outgroup));
             }
         return std::numeric_limits<double>::quiet_NaN();
     }

     unsigned
     PolySNP::Minrec(void) const
     {
         assert(rep->_preprocessed);
         if (rep->_NumPoly < 2)
             return SEQMAXUNSIGNED;
         unsigned a, b, e, numgametes, Rmin = 0, x = 0;
         bool flag = false;

         for (a = x + 1; a < rep->_nsites; ++a)
             {
                 char c11, c12;
                 unsigned states1 = 0;
                 c11 = c12 = 'Z'; // Z is a dummy value
                 // count # states in site a
                 states1 = rep->_counts[a].nStates();

                 c11 = (c11 == 'Z' && rep->_counts[a].a > 0) ? 'A' : 'Z';
                 c11 = (c11 == 'Z' && rep->_counts[a].g > 0) ? 'G' : c11;
                 c11 = (c11 == 'Z' && rep->_counts[a].c > 0) ? 'C' : c11;
                 c11 = (c11 == 'Z' && rep->_counts[a].t > 0) ? 'T' : c11;
                 c11 = (c11 == 'Z' && rep->_counts[a].zero > 0) ? '0' : c11;
                 c11 = (c11 == 'Z' && rep->_counts[a].one > 0) ? '1' : c11;

                 c12 = (c12 == 'Z' && c11 != 'A' && rep->_counts[a].a > 0)
                           ? 'A'
                           : 'Z';
                 c12 = (c12 == 'Z' && c11 != 'G' && rep->_counts[a].g > 0)
                           ? 'G'
                           : c12;
                 c12 = (c12 == 'Z' && c11 != 'C' && rep->_counts[a].c > 0)
                           ? 'C'
                           : c12;
                 c12 = (c12 == 'Z' && c11 != 'T' && rep->_counts[a].t > 0)
                           ? 'T'
                           : c12;
                 c12 = (c12 == 'Z' && c11 != '0' && rep->_counts[a].zero > 0)
                           ? '0'
                           : c12;
                 c12 = (c12 == 'Z' && c11 != '1' && rep->_counts[a].one > 0)
                           ? '1'
                           : c12;

                 for (b = (flag == false) ? x : a - 1; b < a; ++b)
                     {
                         flag = false;
                         numgametes = 0;
                         unsigned states2 = rep->_counts[b].nStates();
                         // need to skip sites with > 2 states
                         if (states1 == 2 && states2 == 2)
                             {
                                 char c21 = 'Z', c22 = 'Z';
                                 c21 = (c21 == 'Z' && rep->_counts[b].a > 0)
                                           ? 'A'
                                           : 'Z';
                                 c21 = (c21 == 'Z' && rep->_counts[b].g > 0)
                                           ? 'G'
                                           : c21;
                                 c21 = (c21 == 'Z' && rep->_counts[b].c > 0)
                                           ? 'C'
                                           : c21;
                                 c21 = (c21 == 'Z' && rep->_counts[b].t > 0)
                                           ? 'T'
                                           : c21;
                                 c21 = (c21 == 'Z' && rep->_counts[b].zero > 0)
                                           ? '0'
                                           : c21;
                                 c21 = (c21 == 'Z' && rep->_counts[b].one > 0)
                                           ? '1'
                                           : c21;

                                 c22 = (c22 == 'Z' && c21 != 'A'
                                        && rep->_counts[b].a > 0)
                                           ? 'A'
                                           : 'Z';
                                 c22 = (c22 == 'Z' && c21 != 'G'
                                        && rep->_counts[b].g > 0)
                                           ? 'G'
                                           : c22;
                                 c22 = (c22 == 'Z' && c21 != 'C'
                                        && rep->_counts[b].c > 0)
                                           ? 'C'
                                           : c22;
                                 c22 = (c22 == 'Z' && c21 != 'T'
                                        && rep->_counts[b].t > 0)
                                           ? 'T'
                                           : c22;
                                 c22 = (c22 == 'Z' && c21 != '0'
                                        && rep->_counts[b].zero > 0)
                                           ? '0'
                                           : c22;
                                 c22 = (c22 == 'Z' && c21 != '1'
                                        && rep->_counts[b].one > 0)
                                           ? '1'
                                           : c22;

                                 for (e = 0; e < rep->_nsam; ++e)
                                     {
                                         if (!rep->_haveOutgroup
                                             || (rep->_haveOutgroup
                                                 && e != rep->_outgroup))
                                             if (toupper((*rep->_data)[e][a])
                                                     == c11
                                                 && toupper((*rep->_data)[e][b])
                                                        == c21)
                                                 {
                                                     ++numgametes;
                                                     break;
                                                 }
                                     }
                                 for (e = 0; e < rep->_nsam; ++e)
                                     {
                                         if (!rep->_haveOutgroup
                                             || (rep->_haveOutgroup
                                                 && e != rep->_outgroup))
                                             if (toupper((*rep->_data)[e][a])
                                                     == c11
                                                 && toupper((*rep->_data)[e][b])
                                                        == c22)
                                                 {
                                                     ++numgametes;
                                                     break;
                                                 }
                                     }
                                 for (e = 0; e < rep->_nsam; ++e)
                                     {
                                         if (!rep->_haveOutgroup
                                             || (rep->_haveOutgroup
                                                 && e != rep->_outgroup))
                                             if (toupper((*rep->_data)[e][a])
                                                     == c12
                                                 && toupper((*rep->_data)[e][b])
                                                        == c21)
                                                 {
                                                     ++numgametes;
                                                     break;
                                                 }
                                     }
                                 for (e = 0; e < rep->_nsam; ++e)
                                     {
                                         if (!rep->_haveOutgroup
                                             || (rep->_haveOutgroup
                                                 && e != rep->_outgroup))
                                             if (toupper((*rep->_data)[e][a])
                                                     == c12
                                                 && toupper((*rep->_data)[e][b])
                                                        == c22)
                                                 {
                                                     ++numgametes;
                                                     break;
                                                 }
                                     }
                                 if (numgametes == 4)
                                     {
                                         ++Rmin;
                                         flag = true;
                                         break;
                                     }
                             }
                     }
                 if (flag == true)
                     x = a;
             }
         return Rmin;
     }

     // Forwards to Recombination::Disequilibrium with the table and outgroup
     // settings held in rep, passing mincount and max_marker_distance
     // through unchanged.
     // Returns an empty vector when rep->_NumPoly < 2.  The data must have
     // been preprocessed (checked by assert in debug builds).
     std::vector<PairwiseLDstats>
     PolySNP::Disequilibrium(const unsigned &mincount,
                             const double &max_marker_distance) const
     {
         assert(rep->_preprocessed);

         const bool enough_sites = !(rep->_NumPoly < 2);
         if (enough_sites)
             {
                 return Recombination::Disequilibrium(
                     rep->_data, rep->_haveOutgroup, rep->_outgroup, mincount,
                     max_marker_distance);
             }

         // Fewer than two polymorphic sites: no pairs to report.
         return std::vector<PairwiseLDstats>();
     }
 } // namespace Sequence
Sequence::PolyTable
The base class for polymorphism tables.

operator()
bool operator()(const std::pair< key, value > &l, const std::pair< key, value > &r) const
Definition: CountingOperators.hpp:85

Sequence::PolySNP::FuLiF
virtual double FuLiF(void) const
Definition: PolySNP.cc:1388

Sequence::thetal
double thetal(const AlleleCountMatrix &ac, const std::int8_t refstate)
Zeng et al.
Definition: thetah_thetal.cc:130

Sequence::PolySNP::VarPi
double VarPi(void) const
Definition: PolySNP.cc:1288

Sequence::Recombination
Methods dealing with recombination.

Sequence::_PolySNPImpl::preprocess
void preprocess(void)
Definition: PolySNP.cc:92

Sequence::PolySNP::NumMutations
virtual unsigned NumMutations(void) const
Definition: PolySNP.cc:823

Sequence::PolySNP::DandVH
double DandVH(void) const
Definition: PolySNP.cc:1614

Sequence::PolySNP::NumSingletons
virtual unsigned NumSingletons(void) const
Definition: PolySNP.cc:844

Sequence::PolySNP::ThetaH
virtual double ThetaH(void) const
Definition: PolySNP.cc:366

Sequence::PolySNP::HudsonsC
double HudsonsC(void) const
Definition: PolySNP.cc:1648

std
STL namespace.

Sequence::PolySNP::NumPoly
unsigned NumPoly(void) const
Definition: PolySNP.cc:807

Sequence::PolySNP::TajimasD
virtual double TajimasD(void) const
Definition: PolySNP.cc:929

PolyTable.hpp
Sequence::PolyTable, a virtual base class for polymorphism tables.

Sequence
The namespace in which this library resides.

Sequence::PolySNP::ThetaW
virtual double ThetaW(void) const
Definition: PolySNP.cc:314

Sequence::PolySNP::b_sub_n
double b_sub_n(void) const
Definition: PolySNP.cc:1537

Sequence::PolySNP::Minrec
virtual unsigned Minrec(void) const
Definition: PolySNP.cc:1665

Sequence::PolySNP::VarThetaW
double VarThetaW(void) const
Definition: PolySNP.cc:1341

Sequence::PolySNP::DandVK
unsigned DandVK(void) const
Definition: PolySNP.cc:1631

PolySNP.hpp
declaration of Sequence::PolySNP, a class to analyze SNP data

Sequence::PolySNP::DepaulisVeuilleStatistics
void DepaulisVeuilleStatistics(void) const
Definition: PolySNP.cc:1050

Sequence::PolySNP::b_sub_n_plus1
double b_sub_n_plus1(void) const
Definition: PolySNP.cc:1552

Sequence::PolySNP::SamplingVarPi
double SamplingVarPi(void) const
Definition: PolySNP.cc:1324

Sequence::PolySNP::WallsB
virtual double WallsB(void) const
Definition: PolySNP.cc:1144

Sequence::PolySNP::a_sub_n_plus1
double a_sub_n_plus1(void) const
Definition: PolySNP.cc:1520

Sequence::Recombination::Disequilibrium
std::vector< PairwiseLDstats > Disequilibrium(const Sequence::PolyTable *data, const bool &haveOutgroup=false, const unsigned &outgroup=0, const unsigned &mincount=1, const double max_distance=std::numeric_limits< double >::max()) __attribute__((deprecated))
Calculate pairwise LD for a Sequence::PolyTable.
Definition: Recombination.cc:353

Sequence::PolySNP::PolySNP
PolySNP(const Sequence::PolyTable *data, bool haveOutgroup=false, unsigned outgroup=0, bool totMuts=true)
Definition: PolySNP.cc:171

Sequence::_PolySNPImpl
Definition: PolySNPimpl.hpp:30

Sequence::PolySNP::FuLiFStar
virtual double FuLiFStar(void) const
Definition: PolySNP.cc:1462

Sequence::PolySNP::NumExternalMutations
virtual unsigned NumExternalMutations(void) const
Definition: PolySNP.cc:885

Sequence::SEQMAXUNSIGNED
const unsigned SEQMAXUNSIGNED
Definition: SeqConstants.cc:32

Sequence::PolySNP::Dnominator
virtual double Dnominator(void) const
Definition: PolySNP.cc:1014

Sequence::PolySNP::ThetaL
virtual double ThetaL(void) const
Definition: PolySNP.cc:594

Sequence::variance
double variance(iterator beg, iterator end)

Sequence::PolySNP::ThetaPi
virtual double ThetaPi(void) const
Definition: PolySNP.cc:193

Sequence::PolySNP::c_sub_n
double c_sub_n(void) const
Definition: PolySNP.cc:1568

Sequence::Recombination::HudsonsC
double HudsonsC(const Sequence::PolyTable *data, const bool &haveOutgroup, const unsigned &outgroup) __attribute__((deprecated))
Definition: Recombination.cc:329

Sequence::PolySNP::WallsBprime
virtual unsigned WallsBprime(void) const
Definition: PolySNP.cc:1262

Sequence::PolySNP::Hprime
virtual double Hprime(const bool &likeThorntonAndolfatto=false) const
Definition: PolySNP.cc:952

Recombination.hpp
namespace Sequence::Recombination

Sequence::PolySNP::a_sub_n
double a_sub_n(void) const
Definition: PolySNP.cc:1504

Sequence::PolySNP::Disequilibrium
std::vector< PairwiseLDstats > Disequilibrium(const unsigned &mincount=1, const double &max_marker_distance=std::numeric_limits< double >::max()) const
Definition: PolySNP.cc:1837

Sequence::PolySNP::WallsQ
virtual double WallsQ(void) const
Definition: PolySNP.cc:1275

Sequence::Different
bool Different(const std::string &seq1, const std::string &seq2, const bool &skip_missing=true, const bool &nucleic_acid=true)
Definition: Comparisons.cc:98

Sequence::PolySNP::d_sub_n
double d_sub_n(void) const
Definition: PolySNP.cc:1595

Sequence::PolySNP::StochasticVarPi
double StochasticVarPi(void) const
Definition: PolySNP.cc:1306

Sequence::PolySNP::FuLiDStar
virtual double FuLiDStar(void) const
Definition: PolySNP.cc:1428

stateCounter.hpp
declaration of Sequence::stateCounter, a class to keep track of nucleotide counts either at a site in...

Comparisons.hpp
declaration of routines for comparing DNA sequences. This file declares a set of functions useful for ...

SeqConstants.hpp

Sequence::PolySNP::FuLiD
virtual double FuLiD(void) const
Definition: PolySNP.cc:1359