Searched refs:kCUDABlockReduceMaxThreads (Results 1 – 4 of 4) sorted by relevance
17 constexpr int kCUDABlockReduceMaxThreads = C10_WARP_SIZE * C10_WARP_SIZE; variable
210 num_threads <= cuda_utils::kCUDABlockReduceMaxThreads, ""); in handle_fused_mode()
372 num_threads() <= cuda_utils::kCUDABlockReduceMaxThreads, in embedding_renorm_cuda_()
89 props->maxThreadsPerBlock, cuda_utils::kCUDABlockReduceMaxThreads); in renormRows()