blockReduce 63 modules/cudev/include/opencv2/cudev/block/reduce.hpp __device__ __forceinline__ void blockReduce(volatile T* smem, T& val, uint tid, const Op& op) blockReduce 72 modules/cudev/include/opencv2/cudev/block/reduce.hpp __device__ __forceinline__ void blockReduce(const tuple<P0, P1, P2, P3, P4, P5, P6, P7, P8, P9>& smem,