Searched defs:numelPerThread (Results 1 – 1 of 1) sorted by relevance
146 const size_t numelPerThread = kBytesPerThread / sizeof(at::BFloat16); in oneShotAllReduceKernel() local211 const size_t numelPerThread = kBytesPerThread / sizeof(at::BFloat16); in twoShotAllReduceKernel() local369 const size_t numelPerThread = kBytesPerThread / sizeof(at::BFloat16); in hybridCubeMeshAllReduceKernel() local469 const auto numelPerThread = kBytesPerThread / elemSize; in getLaunchConfig() local