123456789101112131415161718 |
- #pragma once
- namespace vision {
- namespace ops {
- #define CUDA_1D_KERNEL_LOOP_T(i, n, index_t) \
- for (index_t i = (blockIdx.x * blockDim.x) + threadIdx.x; i < (n); \
- i += (blockDim.x * gridDim.x))
- #define CUDA_1D_KERNEL_LOOP(i, n) CUDA_1D_KERNEL_LOOP_T(i, n, int)
- template <typename integer>
- constexpr __host__ __device__ inline integer ceil_div(integer n, integer m) {
- return (n + m - 1) / m;
- }
- } // namespace ops
- } // namespace vision
|