Searched defs:elements_per_thread (Results 1 – 2 of 2) sorted by relevance
57 constexpr unsigned int elements_per_thread = 8; in getCatGridRocm() local82 unsigned int elements_per_thread = ALIGNED_VEC_LOAD_BYTES / sizeof(T) * in getCatGridContig() local
119 constexpr int elements_per_thread = sizeof(scalar_t) < 8 ? 8 / sizeof(scalar_t) : 1; in triu_tril_cuda_template() local