MaCh3/gpuSplineUtils_8cuh_source.html

//MaCh3 included

#include "Manager/gpuUtils.cuh"

#include "Splines/SplineCommon.h"


/// @brief Make sure all CUDA threads have finished execution.
/// @note Host-side function; the definition is not in this header.
__host__ void SynchroniseSplines();


/// @brief Evaluate the splines on the GPU, using one {y,b,c,d} coefficient
///        array and one {x} array.
/// @param gpu_paramNo_arr Read-only per-spline array of short ints; presumably
///        the parameter number each spline responds to — TODO confirm against
///        the kernel definition.
/// @param gpu_nKnots_arr  Read-only array with the number of knots per spline.
/// @param gpu_coeff_many  Read-only array holding the non-x coefficients.
/// @param gpu_weights     Output array holding the weight for each spline.
/// @param text_coeff_x    Texture object through which the x coefficients are
///        fetched.
/// @note The launch configuration (grid/block layout) is decided by the caller
///       and is not visible from this declaration.
/// @note NOTE(review): `__restrict__` is applied to `text_coeff_x`, which is a
///       texture handle rather than a pointer — confirm the qualifier is
///       intended there.
__global__ void EvalOnGPU_Splines(

    const short int* __restrict__ gpu_paramNo_arr,

    const unsigned int* __restrict__ gpu_nKnots_arr,

    const float* __restrict__ gpu_coeff_many,

    float* __restrict__ gpu_weights,

    const cudaTextureObject_t __restrict__ text_coeff_x);


/// @brief Evaluate the TF1 objects on the GPU (documented elsewhere in the
///        project as using a 5th order polynomial).
/// @param gpu_coeffs_tf1      Read-only array holding the TF1 coefficients.
/// @param gpu_paramNo_arr_tf1 Read-only per-TF1 array of short ints; presumably
///        the parameter number each TF1 responds to — TODO confirm against the
///        kernel definition.
/// @param gpu_weights_tf1     Output array holding the weight for each TF1.
/// @note The launch configuration (grid/block layout) is decided by the caller
///       and is not visible from this declaration.
__global__ void EvalOnGPU_TF1(

  const float* __restrict__ gpu_coeffs_tf1,

  const short int* __restrict__ gpu_paramNo_arr_tf1,

  float* __restrict__ gpu_weights_tf1);


// Only declared when weights are NOT kept on a spline-by-spline basis, i.e.
// when a single total weight per event is produced.
#ifndef Weight_On_SplineBySpline_Basis

/// @brief Evaluate the total spline event weight on the GPU.
/// @param gpu_weights             Read-only array with the weight for each spline.
/// @param gpu_weights_tf1         Read-only array with the weight for each TF1.
/// @param gpu_total_weights       Output array holding the weight for each event.
/// @param text_nParamPerEvent     Texture object for the map tracking how many
///        parameters apply to each event (splines).
/// @param text_nParamPerEvent_TF1 Texture object for the equivalent map for TF1
///        objects.
/// @note The launch configuration (grid/block layout) is decided by the caller
///       and is not visible from this declaration.
__global__ void EvalOnGPU_TotWeight(

  const float* __restrict__ gpu_weights,

  const float* __restrict__ gpu_weights_tf1,


  float* __restrict__ gpu_total_weights,


  const cudaTextureObject_t __restrict__ text_nParamPerEvent,

  const cudaTextureObject_t __restrict__ text_nParamPerEvent_TF1);

#endif


/// @brief Class responsible for calculating spline weights on the GPU.
///
/// Holds the device-side arrays (spline and TF1 coefficients, per-object
/// weights, per-event totals) and the texture objects used by the evaluation
/// kernels declared in this header. All raw device pointers default to
/// nullptr so that an object whose Init/Copy methods have not run yet is in a
/// well-defined "nothing allocated" state.
class SMonolithGPU
{
  public:
    /// @brief Constructor.
    SMonolithGPU();

    /// @brief Destructor.
    virtual ~SMonolithGPU();

    /// @brief Allocate memory on the GPU for the spline monolith.
    /// @param cpu_total_weights Address of the host pointer for the per-event
    ///        total weights (only when weights are not kept spline-by-spline).
    /// @param n_events     Number of events (only when weights are not kept
    ///        spline-by-spline).
    /// @param total_nknots Total number of knots over all splines.
    /// @param n_splines    Number of splines.
    /// @param n_tf1        Number of TF1 objects.
    /// @param Eve_size     Size parameter forwarded to the allocation; exact
    ///        meaning is not visible from this header — TODO confirm.
    __host__ void InitGPU_SplineMonolith(
      #ifndef Weight_On_SplineBySpline_Basis
      float **cpu_total_weights,
      int n_events,
      #endif
      unsigned int total_nknots,
      unsigned int n_splines,
      unsigned int n_tf1,
      int Eve_size);

    /// @brief Copies data from CPU to GPU for the spline monolith.
    /// @param cpu_spline_handler     Host-side struct storing the spline
    ///        monolith information.
    /// @param cpu_many_array_TF1     Host TF1 coefficients.
    /// @param cpu_paramNo_arr_TF1    Host per-TF1 short-int array matching
    ///        gpu_paramNo_TF1_arr.
    /// @param n_events               Number of events (only when weights are
    ///        not kept spline-by-spline).
    /// @param cpu_nParamPerEvent     Host map of how many parameters apply to
    ///        each event (splines).
    /// @param cpu_nParamPerEvent_TF1 Host map of how many parameters apply to
    ///        each event (TF1).
    /// @param n_params     Number of parameters.
    /// @param n_splines    Number of splines.
    /// @param spline_size  Per-spline size; exact meaning is not visible from
    ///        this header — TODO confirm.
    /// @param total_nknots Total number of knots over all splines.
    /// @param n_tf1        Number of TF1 objects.
    /// @note The std::vector arguments are taken by value; this matches the
    ///       out-of-line definition and must not be changed here alone.
    __host__ void CopyToGPU_SplineMonolith(
      SplineMonoStruct* cpu_spline_handler,

      // TF1 related now
      std::vector<float> cpu_many_array_TF1,
      std::vector<short int> cpu_paramNo_arr_TF1,
      #ifndef Weight_On_SplineBySpline_Basis
      int n_events,
      std::vector<unsigned int> cpu_nParamPerEvent,
      // TF1 related now
      std::vector<unsigned int> cpu_nParamPerEvent_TF1,
      #endif
      int n_params,
      unsigned int n_splines,
      short int spline_size,
      unsigned int total_nknots,
      unsigned int n_tf1);

    /// @brief Allocate memory for spline segments.
    /// @param segment Address of the pointer that will hold the segments.
    __host__ void InitGPU_Segments(short int **segment);

    /// @brief Allocate memory for the parameter values.
    /// @param vals Address of the pointer that will hold the values
    ///        (presumably the same buffer later passed to
    ///        RunGPU_SplineMonolith as `vals` — TODO confirm).
    __host__ void InitGPU_Vals(float **vals);

    /// @brief Run the GPU code for the separate {x} and {y,b,c,d} arrays.
    /// @param cpu_weights       Host output: weight per spline
    ///        (spline-by-spline mode only).
    /// @param cpu_weights_tf1   Host output: weight per TF1
    ///        (spline-by-spline mode only).
    /// @param cpu_total_weights Host output: total weight per event
    ///        (default mode only).
    /// @param vals        Holds the changes in parameters.
    /// @param segment     Holds the segments for parameters.
    /// @param h_n_splines Number of splines.
    /// @param h_n_tf1     Number of TF1 objects.
    __host__ void RunGPU_SplineMonolith(
      #ifdef Weight_On_SplineBySpline_Basis
      float* cpu_weights,
      float* cpu_weights_tf1,
      #else
      float* cpu_total_weights,
      #endif
      // Holds the changes in parameters
      float *vals,
      // Holds the segments for parameters
      short int *segment,
      const unsigned int h_n_splines,
      const unsigned int h_n_tf1);

    /// @brief Deallocate the resources allocated for the separate {x} and
    ///        {ybcd} arrays.
    /// @param cpu_total_weights Host per-event total weights (only when weights
    ///        are not kept spline-by-spline).
    __host__ void CleanupGPU_SplineMonolith(
      #ifndef Weight_On_SplineBySpline_Basis
      float *cpu_total_weights
      #endif
      );

    /// @brief Clean up pinned variables on the CPU.
    /// @param segment Segment buffer to release.
    /// @param vals    Parameter-value buffer to release.
    __host__ void CleanupGPU_Segments(short int *segment, float *vals);

  private:
    /// KS: GPU map keeping track of how many parameters apply to each event.
    unsigned int *gpu_nParamPerEvent = nullptr;
    /// KS: GPU map keeping track of how many parameters apply to each event (TF1).
    unsigned int *gpu_nParamPerEvent_TF1 = nullptr;

    /// KS: GPU array to hold the X coefficients.
    float *gpu_coeff_x = nullptr;

    /// GPU array to hold the other coefficients.
    float *gpu_coeff_many = nullptr;

    /// KS: GPU number of knots per spline.
    unsigned int *gpu_nKnots_arr = nullptr;

    /// CW: GPU per-spline array (one entry per spline, not per spline point);
    /// presumably the parameter number of each spline — TODO confirm.
    short int *gpu_paramNo_arr = nullptr;

    /// GPU array to hold the TF1 coefficients.
    float *gpu_coeff_TF1_many = nullptr;
    /// GPU array to hold the number of points.
    short int *gpu_nPoints_arr = nullptr;
    /// CW: GPU per-TF1 array; presumably the parameter number of each TF1
    /// object — TODO confirm.
    short int *gpu_paramNo_TF1_arr = nullptr;

    /// GPU array to hold the weight for each event.
    float *gpu_total_weights = nullptr;
    /// GPU array to hold the weight for each spline.
    float *gpu_weights = nullptr;
    /// GPU array to hold the weight for each TF1.
    float *gpu_weights_tf1 = nullptr;

    // h_NAME declares HOST constants (live on CPU)
    /// Number of params living on CPU.
    int h_n_params;
    /// Number of events living on CPU.
    int h_n_events;

    // ******************************************
    // TEXTURES
    // ******************************************
    /// KS: Texture object used for fetching the X coefficients.
    cudaTextureObject_t text_coeff_x = 0;
    #ifndef Weight_On_SplineBySpline_Basis
    /// KS: Texture for the map of how many parameters apply to each event.
    cudaTextureObject_t text_nParamPerEvent = 0;
    /// KS: Texture for the map of how many parameters apply to each event (TF1).
    cudaTextureObject_t text_nParamPerEvent_TF1 = 0;
    #endif
};


SplineCommon.h
Contains definitions for spline coefficients and structure used in both CPU and GPU code.

SMonolithGPU
Class responsible for calculating spline weight on GPU.
Definition: gpuSplineUtils.cuh:62

SMonolithGPU::text_nParamPerEvent_TF1
cudaTextureObject_t text_nParamPerEvent_TF1
KS: Map keeping track of how many parameters apply to each event, we keep two numbers here {number of ...
Definition: gpuSplineUtils.cuh:229

SMonolithGPU::gpu_nParamPerEvent
unsigned int * gpu_nParamPerEvent
KS: GPU map keeping track of how many parameters apply to each event, we keep two numbers here {number...
Definition: gpuSplineUtils.cuh:184

SMonolithGPU::CleanupGPU_SplineMonolith
__host__ void CleanupGPU_SplineMonolith(float *cpu_total_weights)
This function deallocates the resources allocated for the separate {x} and {ybcd} arrays in the and T...
Definition: gpuSplineUtils.cu:552

SMonolithGPU::text_coeff_x
cudaTextureObject_t text_coeff_x
KS: Textures are L1 cache variables which are well optimised for fetching. Make texture only for vari...
Definition: gpuSplineUtils.cuh:224

SMonolithGPU::gpu_paramNo_TF1_arr
short int * gpu_paramNo_TF1_arr
CW: GPU array with the number of points per TF1 object.
Definition: gpuSplineUtils.cuh:205

SMonolithGPU::InitGPU_Vals
__host__ void InitGPU_Vals(float **vals)
Allocate memory for the parameter values (vals).
Definition: gpuSplineUtils.cu:187

SMonolithGPU::h_n_events
int h_n_events
Number of events living on CPU.
Definition: gpuSplineUtils.cuh:218

SMonolithGPU::gpu_weights
float * gpu_weights
GPU arrays to hold weight for each spline.
Definition: gpuSplineUtils.cuh:210

SMonolithGPU::gpu_coeff_many
float * gpu_coeff_many
GPU arrays to hold other coefficients.
Definition: gpuSplineUtils.cuh:192

SMonolithGPU::gpu_nParamPerEvent_TF1
unsigned int * gpu_nParamPerEvent_TF1
KS: GPU map keeping track of how many parameters apply to each event, we keep two numbers here {number...
Definition: gpuSplineUtils.cuh:186

SMonolithGPU::text_nParamPerEvent
cudaTextureObject_t text_nParamPerEvent
KS: Map keeping track of how many parameters apply to each event, we keep two numbers here {number of ...
Definition: gpuSplineUtils.cuh:227

SMonolithGPU::InitGPU_SplineMonolith
__host__ void InitGPU_SplineMonolith(float **cpu_total_weights, int n_events, unsigned int total_nknots, unsigned int n_splines, unsigned int n_tf1, int Eve_size)
Allocate memory on gpu for spline monolith.
Definition: gpuSplineUtils.cu:106

SMonolithGPU::~SMonolithGPU
virtual ~SMonolithGPU()
destructor
Definition: gpuSplineUtils.cu:100

SMonolithGPU::RunGPU_SplineMonolith
__host__ void RunGPU_SplineMonolith(float *cpu_total_weights, float *vals, short int *segment, const unsigned int h_n_splines, const unsigned int h_n_tf1)
Run the GPU code for the separate many arrays, as in separate {x}, {y,b,c,d} arrays. Pass the segment ...
Definition: gpuSplineUtils.cu:459

SMonolithGPU::gpu_coeff_x
float * gpu_coeff_x
KS: GPU arrays to hold X coefficient.
Definition: gpuSplineUtils.cuh:189

SMonolithGPU::SMonolithGPU
SMonolithGPU()
constructor
Definition: gpuSplineUtils.cu:81

SMonolithGPU::gpu_nPoints_arr
short int * gpu_nPoints_arr
GPU arrays to hold number of points.
Definition: gpuSplineUtils.cuh:203

SMonolithGPU::gpu_weights_tf1
float * gpu_weights_tf1
GPU arrays to hold weight for each TF1.
Definition: gpuSplineUtils.cuh:212

SMonolithGPU::InitGPU_Segments
__host__ void InitGPU_Segments(short int **segment)
Allocate memory for spline segments.
Definition: gpuSplineUtils.cu:178

SMonolithGPU::gpu_nKnots_arr
unsigned int * gpu_nKnots_arr
KS: GPU Number of knots per spline.
Definition: gpuSplineUtils.cuh:195

SMonolithGPU::h_n_params
int h_n_params
Number of params living on CPU.
Definition: gpuSplineUtils.cuh:216

SMonolithGPU::gpu_coeff_TF1_many
float * gpu_coeff_TF1_many
GPU arrays to hold TF1 coefficients.
Definition: gpuSplineUtils.cuh:201

SMonolithGPU::gpu_paramNo_arr
short int * gpu_paramNo_arr
CW: GPU array with the number of points per spline (not per spline point!)
Definition: gpuSplineUtils.cuh:198

SMonolithGPU::CopyToGPU_SplineMonolith
__host__ void CopyToGPU_SplineMonolith(SplineMonoStruct *cpu_spline_handler, std::vector< float > cpu_many_array_TF1, std::vector< short int > cpu_paramNo_arr_TF1, int n_events, std::vector< unsigned int > cpu_nParamPerEvent, std::vector< unsigned int > cpu_nParamPerEvent_TF1, int n_params, unsigned int n_splines, short int spline_size, unsigned int total_nknots, unsigned int n_tf1)
Copies data from CPU to GPU for the spline monolith.
Definition: gpuSplineUtils.cu:201

SMonolithGPU::gpu_total_weights
float * gpu_total_weights
GPU arrays to hold weight for event.
Definition: gpuSplineUtils.cuh:208

SMonolithGPU::CleanupGPU_Segments
__host__ void CleanupGPU_Segments(short int *segment, float *vals)
Clean up pinned variables at CPU.
Definition: gpuSplineUtils.cu:587

EvalOnGPU_TotWeight
__global__ void EvalOnGPU_TotWeight(const float *__restrict__ gpu_weights, const float *__restrict__ gpu_weights_tf1, float *__restrict__ gpu_total_weights, const cudaTextureObject_t __restrict__ text_nParamPerEvent, const cudaTextureObject_t __restrict__ text_nParamPerEvent_TF1)
KS: Evaluate the total spline event weight on the GPU, as in most cases GPU is faster,...
Definition: gpuSplineUtils.cu:424

EvalOnGPU_Splines
__global__ void EvalOnGPU_Splines(const short int *__restrict__ gpu_paramNo_arr, const unsigned int *__restrict__ gpu_nKnots_arr, const float *__restrict__ gpu_coeff_many, float *__restrict__ gpu_weights, const cudaTextureObject_t __restrict__ text_coeff_x)
Evaluate the spline on the GPU, using one {y,b,c,d} array and one {x} array. Should be most efficient a...
Definition: gpuSplineUtils.cu:348

SynchroniseSplines
__host__ void SynchroniseSplines()
Make sure all CUDA threads have finished execution.
Definition: gpuSplineUtils.cu:73

EvalOnGPU_TF1
__global__ void EvalOnGPU_TF1(const float *__restrict__ gpu_coeffs_tf1, const short int *__restrict__ gpu_paramNo_arr_tf1, float *__restrict__ gpu_weights_tf1)
Evaluate the TF1 on the GPU using a 5th order polynomial.
Definition: gpuSplineUtils.cu:397

gpuUtils.cuh
Common CUDA utilities and definitions for shared GPU functionality.

SplineMonoStruct
KS: Struct storing information for spline monolith.
Definition: SplineCommon.h:30