HILA/KennedyPendleton_8h_source.html

#ifndef KENNEDY_PENDLETON_H

#define KENNEDY_PENDLETON_H


#include "plumbing/hila.h"

#include "datatypes/su2.h"


// this is might be too much to have in a single kernel


/**

 * @brief \f$ SU(2) \f$ heatbath

 * @details Generate an \f$ SU(2)\f$ matrix according to Kennedy-Pendleton heatbath.

 * This assumes that the action due to gauge link U is Re Tr U.S^+,

 * where S is the staple. Note sign and normalization of the staple (beta is absorbed in S),

 * and we include hermitian conjugation in definition of the staple for consistency with conventions elsewhere in HILA.

 * @tparam T float-type

 * @param staple Hermitian conjugate of the staple to compute heatbath with. Action ~ Re Tr U.S^+, so this input is S.

 * NB: In general the staple is NOT an SU(2) matrix,

 * however we can describe it using the SU2 class because (i) The sum of SU(2) matrices is proportional to SU(2),

 * (ii) SU2 class does not require that the determinant is always normalized to 1.

 *

 * @return SU2<T>

 */

template <typename T>

SU2<T> KennedyPendleton(const SU2<T> &staple) {


    // action Tr U.S^+ => weight exp(-Tr U.S^+)  (for SU2 the trace is real).

    // Following K-P we need to bring this to form exp(xi Tr a),

    // where a is an SU2 matrix. For this we could project the staple to SU2 (eq. (10) of K-P paper).

    // But since the staple is proportional to SU2 matrix,

    // this just means we normalize by its det and flip the sign:

    // V = S/sqrt(|S|) =>   xi = 1/sqrt(|S|), a = -U.V^+

    // The K-P algorithm generates a new SU2 matrix a = -U.V^+

    // from which the new link U is -a.V.

    // This way of writing things minimizes the needed number of conjugations


    const T xi = ::sqrt(det(staple));

    const SU2<T> V = staple / xi; // this is now in SU(2)


    // 'alpha' that appears in eq (15)

    T alpha = 2.0*xi;


    // Now generate new a = -U.V^+, section 4 of K-P


    int nloops;

    const int LOOPLIM = 100;

    const double pi2 = M_PI * 2.0;

    double r1, r2, r3, delta;

    nloops = 0;

    do {

        // r1, r2 need division by alpha but this is done in one go when setting delta (micro-optimization?)

        r1 = -::log(1.0 - hila::random());

        r2 = -::log(1.0 - hila::random());

        r3 = ::cos(pi2 * hila::random());

        r3 *= r3;

        delta = (r1*r3 + r2) / alpha;


        r3 = hila::random(); // R'''

        nloops++;

    } while (nloops < LOOPLIM && r3*r3 > 1.0 - 0.5*delta);


    T a0 = 1.0 - delta;

    if (nloops >= LOOPLIM) {

        // Failed to find new a0...

        // TODO some error or warning

        a0 = 1e-9;

    }


    // Generate random vector on S2, radius sqrt(1.0-a0**2)

    T rd = 1.0 - a0*a0;


    if (rd <= 0.0) {

        // negative radius^2, something went wrong...

        // TODO some error or warning

        rd = 0.0;

    }


    // ... and put them in the 'a' matrix. Notation gets messy, reminder:

    // SU2 = d + a i\sigma_1 + b i\sigma_2 + c i\sigma_3$

    SU2<T> a;

    a.d = a0;


    r3 = 2.0 * hila::random() - 1.0;

    a.c = ::sqrt(rd) * r3;

    T theta = pi2 * hila::random();

    rd = ::sqrt(rd * (1.0 - ::sqr(r3)));

    a.b = rd * ::cos(theta);

    a.a = rd * ::sin(theta);

    // Could this be optimized by removing sin, cos? http://corysimon.github.io/articles/uniformdistn-on-sphere/


    // Now just get the new link variable from a = -U.V^+

    return -a * V;

}


#endif

cos
Array< n, m, T > cos(Array< n, m, T > a)
Cosine.
Definition array.h:1089

sqrt
Array< n, m, T > sqrt(Array< n, m, T > a)
Square root.
Definition array.h:1039

sin
Array< n, m, T > sin(Array< n, m, T > a)
Sine.
Definition array.h:1079

log
Array< n, m, T > log(Array< n, m, T > a)
Logarithm.
Definition array.h:1069

SU2
Definition su2.h:14

sqr
constexpr T sqr(const T &arg)
Define convenience function sqr(), returning square of argument.
Definition defs.h:160

hila::random
double random()
Real valued uniform random number generator.
Definition hila_gpu.cpp:121