cms-patatrack · fwyzard · May 15, 2019 · Feb 14, 2019 · May 13, 2019
diff --git a/HeterogeneousCore/CUDAUtilities/interface/cudaCompat.h b/HeterogeneousCore/CUDAUtilities/interface/cudaCompat.h
@@ -0,0 +1,94 @@
+#ifndef HeterogeneousCore_CUDAUtilities_interface_cudaCompat_h
+#define HeterogeneousCore_CUDAUtilities_interface_cudaCompat_h
+
+/*
+ * Everything you need to run CUDA code as plain, sequential C++ code
+ */
+
+#ifndef __CUDACC__
+
+#include <algorithm>
+#include <cstdint>
+#include <cstring>
+
+#include <cuda_runtime.h>
+
+namespace cudaCompat {
+
+  // Host-side stand-ins for the CUDA built-ins, so that kernel code can be
+  // compiled and executed as plain sequential C++. Every "block" consists of
+  // a single thread (threadIdx is fixed at 0, blockDim at 1), and the
+  // "atomic" helpers below are ordinary, non-atomic read-modify-write
+  // operations on the pointed-to value.
+
+#ifndef __CUDA_RUNTIME_H__
+  // Minimal three-component replacement for dim3, compiled only when
+  // __CUDA_RUNTIME_H__ is not defined.
+  struct dim3 {
+    uint32_t x, y, z;
+  };
+#endif
+  // Constant thread coordinates: one thread per block, with index 0.
+  const dim3 threadIdx = {0, 0, 0};
+  const dim3 blockDim = {1, 1, 1};
+
+  // Per-thread block index and grid size. Only declared here; resetGrid()
+  // puts them back to block 0 of a 1x1x1 grid.
+  extern thread_local dim3 blockIdx;
+  extern thread_local dim3 gridDim;
+
+  // Returns the previous value of *a and increments *a by one while it is
+  // still below b (converted to T1). Once *a has reached b it is left
+  // unchanged: this helper saturates, it does not wrap around to 0.
+  template <typename T1, typename T2>
+  T1 atomicInc(T1* a, T2 b) {
+    auto ret = *a;
+    if ((*a) < T1(b))
+      (*a)++;
+    return ret;
+  }
+
+  // Adds b to *a and returns the value *a held before the addition.
+  template <typename T1, typename T2>
+  T1 atomicAdd(T1* a, T2 b) {
+    auto ret = *a;
+    (*a) += b;
+    return ret;
+  }
+
+  // Subtracts b from *a and returns the value *a held before the subtraction.
+  template <typename T1, typename T2>
+  T1 atomicSub(T1* a, T2 b) {
+    auto ret = *a;
+    (*a) -= b;
+    return ret;
+  }
+
+  // Stores the smaller of *a and b in *a and returns the previous value of *a.
+  // b is converted to T1 first: std::min needs both arguments to have the
+  // same type, so the call would not compile for T1 != T2 otherwise.
+  template <typename T1, typename T2>
+  T1 atomicMin(T1* a, T2 b) {
+    auto ret = *a;
+    *a = std::min(*a, T1(b));
+    return ret;
+  }
+
+  // Stores the larger of *a and b in *a and returns the previous value of *a.
+  // The result is written through the pointer (*a), not to the pointer
+  // itself; b is converted to T1 for the same reason as in atomicMin.
+  template <typename T1, typename T2>
+  T1 atomicMax(T1* a, T2 b) {
+    auto ret = *a;
+    *a = std::max(*a, T1(b));
+    return ret;
+  }
+
+  // Barriers and fences have nothing to wait for with a single thread.
+  inline void __syncthreads() {}
+  inline void __threadfence() {}
+  // With one thread, the OR / AND over "all threads" is the argument itself.
+  inline bool __syncthreads_or(bool x) { return x; }
+  inline bool __syncthreads_and(bool x) { return x; }
+  // Plain load through the pointer; returns a copy of *x.
+  template <typename T>
+  inline T __ldg(T const* x) {
+    return *x;
+  }
+
+  // Restores the calling thread's grid state: block index 0 in a 1x1x1 grid.
+  inline void resetGrid() {
+    blockIdx = {0, 0, 0};
+    gridDim = {1, 1, 1};
+  }
+
+}  // namespace cudaCompat
+
+#ifndef __CUDA_RUNTIME_H__  // NOTE(review): presumably the <cuda_runtime.h> include guard - confirm
+#define __host__            // empty: the CUDA qualifiers become no-ops in plain C++
+#define __device__          // empty
+#define __global__          // empty
+#define __shared__          // empty: such variables are declared as ordinary variables
+#define __forceinline__     // empty: no inlining hint is substituted
+#endif  // __CUDA_RUNTIME_H__
+
+#ifndef __CUDA_ARCH__  // skipped whenever __CUDA_ARCH__ is defined
+using namespace cudaCompat;  // make the replacements above visible under their unqualified names
+#endif  // __CUDA_ARCH__
+
+#endif
+
+#endif  // HeterogeneousCore_CUDAUtilities_interface_cudaCompat_h
diff --git a/HeterogeneousCore/CUDAUtilities/src/cudaCompat.cc b/HeterogeneousCore/CUDAUtilities/src/cudaCompat.cc
@@ -0,0 +1,15 @@
+#include "HeterogeneousCore/CUDAUtilities/interface/cudaCompat.h"
+
+namespace cudaCompat {
+  // Definitions of the per-thread grid coordinates declared in cudaCompat.h.
+  // They are initialised here, to the same values resetGrid() assigns, so
+  // that every thread's copy starts out as block 0 of a 1x1x1 grid. A single
+  // resetGrid() call made while this translation unit's static objects are
+  // constructed only reaches the copy of the thread that executes it.
+  thread_local dim3 blockIdx = {0, 0, 0};
+  thread_local dim3 gridDim = {1, 1, 1};
+}  // namespace cudaCompat
+
+namespace {
+  // Helper whose construction resets the grid state: its constructor does
+  // nothing except call cudaCompat::resetGrid().
+  class GridInitialiser {
+  public:
+    GridInitialiser() { cudaCompat::resetGrid(); }
+  };
+
+  // File-local instance; constructing it performs the reset once, during
+  // the initialisation of this translation unit's static objects.
+  const GridInitialiser gridInitialiser;
+
+}  // namespace