#pragma once
#include <cstdint>  // int64_t, used by every declaration below

namespace at {

// Forward declaration is sufficient here: each function below only takes
// TensorBase by const reference, so the full class definition is not needed
// by this header.
class TensorBase;

namespace native {

// Declarations of the launchers for the CUDA cumulative (scan) kernels.
// Only declarations live in this header; the definitions are not visible
// from here (presumably in a CUDA translation unit -- confirm).
//
// NOTE: these functions require output tensors to be contiguous
//
// NOTE(review): judging by the parameter names, `self` is the input,
// `values` / `indices` / `result` are the outputs, and `dim` is the dimension
// the scan runs along -- confirm against the definitions.

// Launcher for the cummax kernel (two output-like tensors: values, indices).
void launch_cummax_cuda_kernel(
    const TensorBase& self,
    const TensorBase& values,
    const TensorBase& indices,
    int64_t dim);

// Launcher for the cummin kernel; same parameter layout as cummax.
void launch_cummin_cuda_kernel(
    const TensorBase& self,
    const TensorBase& values,
    const TensorBase& indices,
    int64_t dim);

// Launcher for the logcumsumexp kernel. Note the parameter order differs from
// the two launchers above: `result` comes first, then `self`.
void launch_logcumsumexp_cuda_kernel(
    const TensorBase& result,
    const TensorBase& self,
    int64_t dim);

// Launcher for the cumsum kernel (`result` first, then `self`).
void launch_cumsum_cuda_kernel(
    const TensorBase& result,
    const TensorBase& self,
    int64_t dim);

// Launcher for the cumprod kernel (`result` first, then `self`).
void launch_cumprod_cuda_kernel(
    const TensorBase& result,
    const TensorBase& self,
    int64_t dim);

}} // namespace at::native