Implement CUDA IProductWRTDerivBase sum-factorization kernels
Merged
requested to merge CFD-Xing/redesign-prototypes:iproductderivbase_sum_fac_cuda_kernels into master
1 unresolved thread
Compare changes
Files
14@@ -6,14 +8,16 @@
@@ -21,16 +25,20 @@ void IProductWRTBase2DKernel(const size_t gridSize, const size_t blockSize,
@@ -49,7 +57,7 @@ public:
@@ -58,25 +66,14 @@ public:
@@ -126,15 +123,33 @@ public:
@@ -150,17 +165,37 @@ public:
@@ -180,17 +215,37 @@ public:
@@ -220,18 +275,19 @@ private:
@@ -239,67 +295,67 @@ void IProductWRTBase2DKernel(const size_t gridSize, const size_t blockSize,