lalsuite/lalpulsar/_compute_fstat___demod___compute_fa_fb_8c_source.html

//

// Copyright (C) 2012--2015 Karl Wette

// Copyright (C) 2005--2007, 2009, 2010, 2012, 2014 Reinhard Prix

// Copyright (C) 2007--2010, 2012 Bernd Machenschalk

// Copyright (C) 2007 Chris Messenger

// Copyright (C) 2006 John T. Whelan, Badri Krishnan

//

// This program is free software; you can redistribute it and/or modify

// it under the terms of the GNU General Public License as published by

// the Free Software Foundation; either version 2 of the License, or

// (at your option) any later version.

//

// This program is distributed in the hope that it will be useful,

// but WITHOUT ANY WARRANTY; without even the implied warranty of

// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

// GNU General Public License for more details.

//

// You should have received a copy of the GNU General Public License

// along with with program; see the file COPYING. If not, write to the

// Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,

// MA  02110-1301  USA

//


// this function definition 'template' requires 2 macros to be set:

// FUNC: the function name

// HOTLOOP_SOURCE: the filename to be included containing the hotloop source


/* Forward declaration of the templated Fa/Fb demodulation routine; the
 * actual name is supplied by the including file through the FUNC macro. */
int FUNC( COMPLEX8 *Fa,
          COMPLEX8 *Fb,
          FstatAtomVector **FstatAtoms,
          const SFTVector *sfts,
          const PulsarSpins fkdot,
          const SSBtimes *tSSB,
          const AMCoeffs *amcoe,
          const UINT4 Dterms );


// ComputeFaFb: DTERMS define used for loop unrolling in some hotloop variants.
// NOTE(review): this is a compile-time constant, distinct from the run-time
// 'Dterms' argument of FUNC(); presumably unrolled hotloops require both to
// agree -- confirm against the individual HOTLOOP_SOURCE files.

#define DTERMS 8

// Threshold on the fractional bin offset kappa_star: FUNC() only enters the
// included hotloop when LD_SMALL4 < kappa_star < 1 - LD_SMALL4, and otherwise
// falls back to picking a single SFT bin.
#define LD_SMALL4       (2.0e-4)                /* "small" number for REAL4 */

// Double-precision 1/(2 pi); applied to Fa, Fb and to the per-SFT atoms.
#define OOTWOPI         (1.0 / LAL_TWOPI)       /* 1/2pi */

// Single-precision 2 pi; scales the selected SFT bin in the small-remainder branch.
#define TWOPI_FLOAT     6.28318530717958f       /* single-precision 2*pi */

// Single-precision 1/(2 pi); not referenced in this template itself
// (presumably used by some HOTLOOP_SOURCE variants -- TODO confirm).
#define OOTWOPI_FLOAT   (1.0f / TWOPI_FLOAT)    /* single-precision 1 / (2pi) */


/* Branch-prediction hint: gcc-4.1.2 was observed to mispredict the case
 * distinction around the hot-loop, so tell GNU-compatible compilers which
 * outcome is the probable one.  Other compilers simply evaluate the
 * expression unchanged. */
#if defined(__GNUC__)
#  define likely(x)       __builtin_expect((x),1)
#else
#  define likely(x)       (x)
#endif


// Revamped version of LALDemod() (based on TestLALDemod() in CFS).
// Compute JKS's Fa and Fb, which are ingredients for calculating the F-statistic.
//
// For every SFT alpha this routine
//   1. evaluates the phase terms phi_alpha and Dphi_alpha from the spin
//      parameters 'fkdot' and the SSB timing (DeltaT_alpha, Tdot_alpha),
//   2. derives the central frequency bin kstar and the window [k0, k1] of
//      2*Dterms bins around it, and checks that the window lies inside the SFT,
//   3. obtains Q_alpha = e^{i 2 pi lambda_alpha} and the kernel-weighted bin
//      sum XP_alpha (from HOTLOOP_SOURCE, or from a single bin if the
//      fractional offset is within LD_SMALL4 of an integer),
//   4. accumulates a_alpha * Q * XP into Fa and b_alpha * Q * XP into Fb.
// Both sums are multiplied by 1/(2 pi) before returning.
//
// Frequency resolution, first bin and number of bins are taken from the
// *first* SFT only; all SFTs are assumed to share them (not verified here).
//
// If 'FstatAtoms' is non-NULL, '*FstatAtoms' must be NULL on entry and is set
// to a newly created vector with one atom per SFT. If a later error occurs
// (e.g. bins not covered), that vector is NOT freed here and stays reachable
// through '*FstatAtoms'.
//
// Returns XLAL_SUCCESS on success; invalid input, allocation failure or
// uncovered frequency bins are reported through XLAL_ERROR() / XLAL_CHECK().
int
FUNC( COMPLEX8 *Fa,                         /* [out] Fa returned */
      COMPLEX8 *Fb,                         /* [out] Fb returned */
      FstatAtomVector **FstatAtoms,         /* [in,out] if !NULL: return Fstat atoms vector */
      const SFTVector *sfts,                /* [in] input SFTs */
      const PulsarSpins fkdot,              /* [in] frequency and derivatives fkdot = d^kf/dt^k */
      const SSBtimes *tSSB,                 /* [in] SSB timing series for particular sky-direction */
      const AMCoeffs *amcoe,                /* [in] antenna-pattern coefficients for this sky-direction */
      const UINT4 Dterms                    /* [in] Dterms to keep in Dirichlet kernel */
    )
{

  /* ----- check validity of input */
  if ( !Fa || !Fb ) {
    XLALPrintError( "\nOutput-pointer is NULL !\n\n" );
    XLAL_ERROR( XLAL_EINVAL );
  }

  if ( !sfts || !sfts->data ) {
    XLALPrintError( "\nInput SFTs are NULL!\n\n" );
    XLAL_ERROR( XLAL_EINVAL );
  }

  /* the first SFT is dereferenced below to obtain deltaF, f0 and the bin count */
  if ( ( sfts->length == 0 ) || !sfts->data[0].data ) {
    XLALPrintError( "\nInput SFT vector is empty or first SFT has no data!\n\n" );
    XLAL_ERROR( XLAL_EINVAL );
  }

  /* Tsft = 1/deltaF and f0/deltaF are computed below: deltaF must be positive */
  if ( !( sfts->data[0].deltaF > 0 ) ) {
    XLALPrintError( "\nInput SFTs have non-positive frequency resolution deltaF!\n\n" );
    XLAL_ERROR( XLAL_EINVAL );
  }

  if ( !tSSB || !tSSB->DeltaT || !tSSB->Tdot || !amcoe || !amcoe->a || !amcoe->b ) {
    XLALPrintError( "\nIllegal NULL in input !\n\n" );
    XLAL_ERROR( XLAL_EINVAL );
  }

  /* Dterms == 0 would make 'Dterms - 1' wrap around in the small-remainder branch */
  if ( Dterms == 0 ) {
    XLALPrintError( "\nDterms must be > 0 !\n\n" );
    XLAL_ERROR( XLAL_EINVAL );
  }

  if ( PULSAR_MAX_SPINS > LAL_FACT_MAX ) {
    XLALPrintError( "\nInverse factorials table only up to order s=%d, can't handle %d spin-order\n\n",
                    LAL_FACT_MAX, PULSAR_MAX_SPINS - 1 );
    XLAL_ERROR( XLAL_EINVAL );
  }

  UINT4 alpha;                  /* loop index over SFTs */
  UINT4 spdnOrder;              /* maximal spindown-orders */
  UINT4 numSFTs;                /* number of SFTs (M in the Notes) */
  REAL8 Tsft;                   /* length of SFTs in seconds */
  INT4 freqIndex0;              /* index of first frequency-bin in SFTs */
  INT4 freqIndex1;              /* index of last frequency-bin in SFTs (inclusive) */

  REAL4 *a_al, *b_al;           /* pointer to alpha-arrays over a and b */
  REAL8 *DeltaT_al, *Tdot_al;   /* pointer to alpha-arrays of SSB-timings */
  SFTtype *SFT_al;              /* SFT alpha  */

  /* ----- prepare convenience variables */
  numSFTs = sfts->length;
  Tsft = 1.0 / sfts->data[0].deltaF;
  {
    REAL8 dFreq = sfts->data[0].deltaF;
    freqIndex0 = ( UINT4 )( sfts->data[0].f0 / dFreq + 0.5 ); /* lowest frequency-index */
    /* last *valid* bin: the SFT holds 'length' bins starting at freqIndex0.
     * (Previously this was one past the end, letting the coverage check below
     * accept a window whose last bin k1 lies outside the SFT data.) */
    freqIndex1 = freqIndex0 + ( INT4 )sfts->data[0].data->length - 1;
  }

  // locally initialize sin/cos lookuptable, as some hotloops use that directly
  static int firstcall = 1;
  if ( firstcall ) {
    XLALSinCosLUTInit();
    firstcall = 0;
  }

  /* ----- prepare return of 'FstatAtoms' if requested */
  if ( FstatAtoms != NULL ) {
    XLAL_CHECK( ( *FstatAtoms == NULL ), XLAL_EINVAL );
    XLAL_CHECK( ( ( *FstatAtoms ) = XLALCreateFstatAtomVector( numSFTs ) ) != NULL, XLAL_EFUNC );

    ( *FstatAtoms )->TAtom = Tsft;   /* time-baseline of returned atoms is Tsft */

  } /* if returnAtoms */

  // ----- find highest non-zero spindown-entry ----------
  for ( spdnOrder = PULSAR_MAX_SPINS - 1;  spdnOrder > 0 ; spdnOrder -- )
    if ( fkdot[spdnOrder] != 0.0 ) {
      break;
    }

  ( *Fa ) = 0.0f;
  ( *Fb ) = 0.0f;

  a_al = amcoe->a->data;        /* point to beginning of alpha-arrays */
  b_al = amcoe->b->data;
  DeltaT_al = tSSB->DeltaT->data;
  Tdot_al = tSSB->Tdot->data;
  SFT_al = sfts->data;

  /* Loop over all SFTs  */
  for ( alpha = 0; alpha < numSFTs; alpha++ ) {
    REAL4 a_alpha, b_alpha;

    INT4 kstar;               /* central frequency-bin k* = floor(Dphi_alpha) */
    INT4 k0, k1;              /* first and last bin (inclusive) of the 2*Dterms window */

    COMPLEX8 *Xalpha = SFT_al->data->data; /* pointer to current SFT-data */
    REAL4 realQ, imagQ;       /* Re and Im of Q = e^{i 2 pi lambda_alpha} */
    REAL4 realXP, imagXP;     /* Re/Im of sum_k X_ak * P_ak */
    REAL4 realQXP, imagQXP;   /* Re/Im of Q_alpha R_alpha */

    REAL8 lambda_alpha, kappa_star;

    /* ----- calculate lambda_alpha */
    {
      UINT4 s;                /* loop-index over spindown-order */
      REAL8 phi_alpha, Dphi_alpha, DT_al;
      REAL8 Tas;      /* temporary variable to calculate (DeltaT_alpha)^s */
      REAL8 TAS_invfact_s;

      /* init for s=0 */
      phi_alpha = 0.0;
      Dphi_alpha = 0.0;
      DT_al = ( *DeltaT_al );
      Tas = 1.0;              /* DeltaT_alpha ^ 0 */
      TAS_invfact_s = 1.0;  /* TAS / s! */

      /* Dphi_alpha accumulates fkdot[s] * DT^s / s!,
       * phi_alpha  accumulates fkdot[s] * DT^(s+1) / (s+1)!  */
      for ( s = 0; s <= spdnOrder; s++ ) {
        REAL8 fsdot = fkdot[s];
        Dphi_alpha += fsdot * TAS_invfact_s;  /* here: DT^s/s! */
        Tas *= DT_al;                         /* now: DT^(s+1) */
        TAS_invfact_s = Tas * LAL_FACT_INV[s + 1];
        phi_alpha += fsdot * TAS_invfact_s;
      } /* for s <= spdnOrder */

      /* Step 3: apply global factors to complete Dphi_alpha */
      Dphi_alpha *= Tsft * ( *Tdot_al );              /* guaranteed > 0 ! */
      lambda_alpha = 0.5 * Dphi_alpha - phi_alpha;

      kstar = ( INT4 )( Dphi_alpha ); /* k* = floor(Dphi_alpha) for positive Dphi */
      kappa_star = Dphi_alpha - 1.0 * kstar;  /* remainder of Dphi_alpha: >= 0 ! */

      /* ----- check that required frequency-bins are found in the SFTs ----- */
      /* signed arithmetic throughout: avoid the INT4/UINT4 mix wrapping around */
      k0 = kstar - ( INT4 )Dterms + 1;
      k1 = kstar + ( INT4 )Dterms;

      if ( ( k0 < freqIndex0 ) || ( k1 > freqIndex1 ) ) {
        XLAL_ERROR( XLAL_EDOM, "Required frequency-bins [%d, %d] not covered by SFT-interval [%d, %d]\n"
                    "\t\t[Parameters: alpha:%d, Dphi_alpha:%e, Tsft:%e, *Tdot_al:%e]\n",
                    k0, k1, freqIndex0, freqIndex1, alpha, Dphi_alpha, Tsft, *Tdot_al );
      }

    } /* compute kappa_star, lambda_alpha */

    /* ---------- calculate the (truncated to Dterms) sum over k ---------- */

    /* ---------- ATTENTION: this the "hot-loop", which will be
     * executed many millions of times, so anything in here
     * has a HUGE impact on the whole performance of the code.
     *
     * DON'T touch *anything* in here unless you really know
     * what you're doing !!
     *------------------------------------------------------------
     */
    {
      // ----- start: hotloop ----------
      COMPLEX8 *Xalpha_l = Xalpha + k0 - freqIndex0;  /* first frequency-bin in sum */

      /* somehow the branch prediction of gcc-4.1.2 terribly fails
         with the current case distinction in the hot-loop,
         having a severe impact on runtime of the E@H Linux App.
         So let's allow to give gcc a hint which path has a higher probability */
      if ( likely( ( kappa_star > LD_SMALL4 ) && ( kappa_star < 1.0 - LD_SMALL4 ) ) ) {
        /* if |remainder| > LD_SMALL4, ie no danger of denominator -> 0 */

        /* The included source must assign realQ, imagQ, realXP and imagXP:
         * they are consumed right after this block. */
#include HOTLOOP_SOURCE

      } /* if  */
      else {
        /* otherwise: lim_{rem->0}P_alpha,k  = 2pi delta_{k,kstar} */
        UINT4 ind0;

        /* real- and imaginary part of e^{i 2 pi lambda_alpha } */
        XLALSinCos2PiLUT( &imagQ, &realQ, lambda_alpha );

        /* Xalpha_l[0] is bin k0 = kstar - Dterms + 1, so offset Dterms-1 is
         * bin kstar (remainder ~ 0) and offset Dterms is bin kstar+1
         * (remainder ~ 1). */
        if ( kappa_star <= LD_SMALL4 ) {
          ind0 = Dterms - 1;
        } else {
          ind0 = Dterms;
        }

        realXP = TWOPI_FLOAT * crealf( Xalpha_l[ind0] );
        imagXP = TWOPI_FLOAT * cimagf( Xalpha_l[ind0] );

      } /* if |remainder| <= LD_SMALL4 */

    } // ----- end: hotloop ----------

    /* complex product Q_alpha * XP_alpha */
    realQXP = realQ * realXP - imagQ * imagXP;
    imagQXP = realQ * imagXP + imagQ * realXP;

    /* we're done: ==> combine these into Fa and Fb */
    a_alpha = ( *a_al );
    b_alpha = ( *b_al );

    COMPLEX8 Fa_alpha = crect( a_alpha * realQXP, a_alpha * imagQXP );
    ( *Fa ) += Fa_alpha;

    COMPLEX8 Fb_alpha = crect( b_alpha * realQXP, b_alpha * imagQXP );
    ( *Fb ) += Fb_alpha;

    /* store per-SFT F-stat 'atoms' for transient-CW search */
    if ( FstatAtoms != NULL ) {
      ( *FstatAtoms )->data[alpha].timestamp  = SFT_al->epoch.gpsSeconds;
      ( *FstatAtoms )->data[alpha].a2_alpha   = a_alpha * a_alpha;
      ( *FstatAtoms )->data[alpha].b2_alpha   = b_alpha * b_alpha;
      ( *FstatAtoms )->data[alpha].ab_alpha   = a_alpha * b_alpha;
      /* atoms carry the same 1/(2 pi) normalisation as the final Fa, Fb */
      ( *FstatAtoms )->data[alpha].Fa_alpha   = OOTWOPI * Fa_alpha;
      ( *FstatAtoms )->data[alpha].Fb_alpha   = OOTWOPI * Fb_alpha;
    }

    /* advance pointers over alpha */
    a_al ++;
    b_al ++;
    DeltaT_al ++;
    Tdot_al ++;
    SFT_al ++;

  } /* for alpha < numSFTs */

  /* return result */
  ( *Fa ) *= OOTWOPI;
  ( *Fb ) *= OOTWOPI;

  return XLAL_SUCCESS;

} // FUNC()

LD_SMALL4
#define LD_SMALL4
Definition: ComputeFstat_Demod_ComputeFaFb.c:33

likely
#define likely(x)
Definition: ComputeFstat_Demod_ComputeFaFb.c:41

TWOPI_FLOAT
#define TWOPI_FLOAT
Definition: ComputeFstat_Demod_ComputeFaFb.c:35

FUNC
int FUNC(COMPLEX8 *Fa, COMPLEX8 *Fb, FstatAtomVector **FstatAtoms, const SFTVector *sfts, const PulsarSpins fkdot, const SSBtimes *tSSB, const AMCoeffs *amcoe, const UINT4 Dterms)
Definition: ComputeFstat_Demod_ComputeFaFb.c:49

OOTWOPI
#define OOTWOPI
Definition: ComputeFstat_Demod_ComputeFaFb.c:34

k0
coeffs k0

k1
coeffs k1

XLALCreateFstatAtomVector
FstatAtomVector * XLALCreateFstatAtomVector(const UINT4 length)
Create a FstatAtomVector of the given length.
Definition: ComputeFstat.c:276

LAL_FACT_INV
static const REAL8 LAL_FACT_INV[]

LAL_FACT_MAX
#define LAL_FACT_MAX

crect
#define crect(re, im)

REAL8
double REAL8

UINT4
uint32_t UINT4

COMPLEX8
float complex COMPLEX8

INT4
int32_t INT4

REAL4
float REAL4

PulsarSpins
REAL8 PulsarSpins[PULSAR_MAX_SPINS]
Typedef for fixed-size array holding GW frequency and derivatives fk = d^k Freq/dt^k|(tau_ref)
Definition: PulsarDataTypes.h:127

PULSAR_MAX_SPINS
#define PULSAR_MAX_SPINS
maximal number of spin-parameters (Freq + spindowns) we can handle
Definition: PulsarDataTypes.h:108

XLALSinCos2PiLUT
int XLALSinCos2PiLUT(REAL4 *sin2pix, REAL4 *cos2pix, REAL8 x)
Calculate sin(2*pi*x) and cos(2*pi*x) to roughly 1e-7 precision using a lookup-table and Taylor-expan...
Definition: SinCosLUT.c:97

XLALSinCosLUTInit
void XLALSinCosLUTInit(void)
Definition: SinCosLUT.c:49

XLAL_ERROR
#define XLAL_ERROR(...)

XLAL_CHECK
#define XLAL_CHECK(assertion,...)

XLALPrintError
int XLALPrintError(const char *fmt,...) _LAL_GCC_PRINTF_FORMAT_(1

XLAL_SUCCESS
XLAL_SUCCESS

XLAL_EFUNC
XLAL_EFUNC

XLAL_EDOM
XLAL_EDOM

XLAL_EINVAL
XLAL_EINVAL

lalpulsar_PiecewiseSearch.s
s
Definition: lalpulsar_PiecewiseSearch.py:957

lalpulsar_PiecewiseSearch.Tsft
Tsft
Definition: lalpulsar_PiecewiseSearch.py:598

test_computePSD.numSFTs
numSFTs
Definition: test_computePSD.py:68

alpha
double alpha

AMCoeffs
This structure contains the per-SFT (weighted) antenna-pattern functions $a_\alpha$, $b_\alpha$, with $\alpha$ the SFT-index,...
Definition: LALComputeAM.h:63

AMCoeffs::b
REAL4Vector * b
(weighted) per-SFT antenna-pattern function $b_\alpha$
Definition: LALComputeAM.h:65

AMCoeffs::a
REAL4Vector * a
(weighted) per-SFT antenna-pattern function $a_\alpha$
Definition: LALComputeAM.h:64

COMPLEX8FrequencySeries

COMPLEX8FrequencySeries::epoch
LIGOTimeGPS epoch

COMPLEX8FrequencySeries::f0
REAL8 f0

COMPLEX8FrequencySeries::deltaF
REAL8 deltaF

COMPLEX8FrequencySeries::data
COMPLEX8Sequence * data

COMPLEX8FrequencySeriesVector
A vector of COMPLEX8FrequencySeries.
Definition: PulsarDataTypes.h:70

COMPLEX8FrequencySeriesVector::data
COMPLEX8FrequencySeries * data
Pointer to the data array.
Definition: PulsarDataTypes.h:75

COMPLEX8FrequencySeriesVector::length
UINT4 length
Number of elements in array.
Definition: PulsarDataTypes.h:74

COMPLEX8Vector::length
UINT4 length

COMPLEX8Vector::data
COMPLEX8 * data

FstatAtomVector
A vector of $\mathcal{F}$-statistic 'atoms', i.e.
Definition: ComputeFstat.h:175

LIGOTimeGPS::gpsSeconds
INT4 gpsSeconds

REAL4Vector::data
REAL4 * data

REAL8Vector::data
REAL8 * data

SSBtimes
Simple container for two REAL8-vectors, namely the SSB-timings DeltaT_alpha and Tdot_alpha,...
Definition: SSBtimes.h:60

SSBtimes::Tdot
REAL8Vector * Tdot
dT/dt : time-derivative of SSB-time wrt local time for SFT-alpha
Definition: SSBtimes.h:63

SSBtimes::DeltaT
REAL8Vector * DeltaT
Time-difference of SFT-alpha - tau0 in SSB-frame.
Definition: SSBtimes.h:62