Home
last modified time | relevance | path

Searched refs:ThreadMap (Results 1 – 25 of 85) sorted by relevance

1234

/aosp_15_r20/external/pytorch/aten/src/ATen/native/transformers/cuda/mem_eff_attention/iterators/
H A Depilogue_predicated_tile_iterator.h77 using ThreadMap = ThreadMap_;
78 using Shape = typename ThreadMap::Shape;
90 static int const kElementsPerAccess = ThreadMap::kElementsPerAccess;
91 static int const kThreads = ThreadMap::kThreads;
92 static int const kIterations = ThreadMap::Count::kTile;
95 ThreadMap::Iterations::kRow > 0,
98 ThreadMap::Iterations::kGroup > 0,
101 ThreadMap::Iterations::kCluster > 0,
104 ThreadMap::Iterations::kColumn > 0,
110 ThreadMap::Iterations::kColumn * ThreadMap::Iterations::kRow *
[all …]
H A Dpredicated_tile_iterator_residual_last.h148 typename ThreadMap,
149 int AccessSize = ThreadMap::kElementsPerAccess,
187 using ThreadMap = ThreadMap_; variable
211 ThreadMap,
220 ThreadMap::Iterations::kCount * ThreadMap::kElementsPerAccess>;
376 for (int s = 0; s < ThreadMap::Iterations::kStrided; ++s) { in load_with_byte_offset()
378 for (int c = 0; c < ThreadMap::Iterations::kContiguous; ++c) { in load_with_byte_offset()
382 kAccessesPerVector * (c + s * ThreadMap::Iterations::kContiguous); in load_with_byte_offset()
421 for (int s = 0; s < ThreadMap::Iterations::kStrided; ++s) { in store_with_byte_offset()
423 for (int c = 0; c < ThreadMap::Iterations::kContiguous; ++c) { in store_with_byte_offset()
[all …]
H A Dpredicated_tile_access_iterator_residual_last.h76 typename ThreadMap,
111 using ThreadMap = ThreadMap_; variable
129 ThreadMap,
133 ThreadMap::kElementsPerAccess / AccessType::kElements;
136 !(ThreadMap::kElementsPerAccess % AccessType::kElements),
159 ThreadMap>()()) {} in Params()
326 (ThreadMap::Delta::kContiguous * sizeof_bits<Element>::value / in get()
330 the_predicates.iteration_strided_ * ThreadMap::Delta::kStrided; in get()
342 (ThreadMap::Delta::kContiguous * in get()
362 ThreadMap::Iterations::kContiguous) {
[all …]
H A Dmake_residual_last.h26 typename ThreadMap,
34 ThreadMap,
42 ThreadMap,
52 typename ThreadMap,
60 ThreadMap,
68 ThreadMap,
/aosp_15_r20/external/pytorch/aten/src/ATen/native/transformers/cuda/mem_eff_attention/epilogue/
H A Depilogue_pipelined.h594 using ThreadMap = typename OutputTileIterator::ThreadMap;
597 for (int cluster = 0; cluster < ThreadMap::Iterations::kCluster;
600 for (int group = 0; group < ThreadMap::Iterations::kGroup; ++group) {
602 for (int row = 0; row < ThreadMap::Iterations::kRow; ++row) {
603 int row_offset = row * ThreadMap::Delta::kRow +
604 group * ThreadMap::Delta::kGroup +
605 cluster * ThreadMap::Delta::kCluster;
608 ThreadMap::Iterations::kRow *
609 (group + ThreadMap::Iterations::kGroup * cluster));
611 for (int column = 0; column < ThreadMap::Iterations::kColumn;
[all …]
/aosp_15_r20/external/webrtc/modules/remote_bitrate_estimator/test/
H A Dbwe_test_logging.cc85 ThreadMap::iterator it = thread_map_.find(rtc::CurrentThreadId()); in Log()
122 ThreadMap::iterator it = thread_map_.find(rtc::CurrentThreadId()); in Plot()
136 ThreadMap::iterator it = thread_map_.find(rtc::CurrentThreadId()); in PlotBar()
149 ThreadMap::iterator it = thread_map_.find(rtc::CurrentThreadId()); in PlotBaselineBar()
165 ThreadMap::iterator it = thread_map_.find(rtc::CurrentThreadId()); in PlotErrorBar()
184 ThreadMap::iterator it = thread_map_.find(rtc::CurrentThreadId()); in PlotLimitErrorBar()
199 ThreadMap::iterator it = thread_map_.find(rtc::CurrentThreadId()); in PlotLabel()
246 ThreadMap::iterator it = thread_map_.find(rtc::CurrentThreadId()); in PopState()
H A Dbwe_test_logging.h339 typedef std::map<uint32_t, ThreadState> ThreadMap; typedef
353 ThreadMap thread_map_;
/aosp_15_r20/external/pytorch/aten/src/ATen/native/transformers/cuda/mem_eff_attention/transform/
H A Dtile_smem_loader.h30 using ThreadMap = cutlass::transform::PitchLinearStripminedThreadMap< variable
43 ThreadMap>; // ThreadMap
50 ThreadMap>; // ThreadMap
/aosp_15_r20/external/pytorch/aten/src/ATen/native/cuda/cutlass_extensions/gemm/threadblock/
H A Ddq_mma_multistage.h161 static int const AsyncCopyIterationsPerStageA = IteratorA::ThreadMap::Iterations::kCount;
164 static int const AsyncCopyIterationsPerStageB = IteratorB::ThreadMap::Iterations::kCount;
257 … * IteratorA::ThreadMap::kElementsPerAccess / IteratorA::kAccessesPerVector / 8;
288 … * IteratorB::ThreadMap::kElementsPerAccess / IteratorB::kAccessesPerVector / 8;
359 … * IteratorA::ThreadMap::kElementsPerAccess / IteratorA::kAccessesPerVector in operator()
385 … * IteratorB::ThreadMap::kElementsPerAccess / IteratorB::kAccessesPerVector in operator()
/aosp_15_r20/external/pytorch/aten/src/ATen/native/transformers/cuda/mem_eff_attention/gemm/
H A Dcustom_mma_multistage.h146 IteratorA::ThreadMap::Iterations::kCount;
150 IteratorB::ThreadMap::Iterations::kCount;
310 IteratorA::ThreadMap::kElementsPerAccess /
346 IteratorB::ThreadMap::kElementsPerAccess /
397 IteratorA::ThreadMap::kElementsPerAccess / in _prologue()
427 IteratorB::ThreadMap::kElementsPerAccess / in _prologue()
H A Dmma_from_smem.h795 IteratorB1::ThreadMap::Iterations::kCount;
945 IteratorB1::ThreadMap::kElementsPerAccess /
988 IteratorB1::ThreadMap::kElementsPerAccess / in _prologue()
/aosp_15_r20/external/perfetto/ui/src/plugins/dev.perfetto.Thread/
H A Dindex.ts17 import {ThreadDesc, ThreadMap} from '../dev.perfetto.Thread/threads';
58 private threads?: ThreadMap;
H A Dthreads.ts24 export type ThreadMap = ReadonlyMap<number, ThreadDesc>; alias
/aosp_15_r20/external/perfetto/ui/src/plugins/org.kernel.SuspendResumeLatency/
H A Dindex.ts24 import {ThreadMap} from '../dev.perfetto.Thread/threads';
37 private readonly threads: ThreadMap,
H A Dsuspend_resume_details.ts29 import {ThreadMap} from '../dev.perfetto.Thread/threads';
48 private readonly threads: ThreadMap,
/aosp_15_r20/external/perfetto/ui/src/plugins/dev.perfetto.CpuSlices/
H A Dsched_details_tab.ts36 import {ThreadDesc, ThreadMap} from '../dev.perfetto.Thread/threads';
62 private readonly threads: ThreadMap,
H A Dcpu_slice_track.ts41 import {ThreadMap} from '../dev.perfetto.Thread/threads';
73 private readonly threads: ThreadMap,
/aosp_15_r20/external/perfetto/ui/src/plugins/dev.perfetto.ProcessSummary/
H A Dprocess_scheduling_track.ts31 import {ThreadMap} from '../dev.perfetto.Thread/threads';
66 private readonly threads: ThreadMap,
/aosp_15_r20/external/pytorch/aten/src/ATen/native/transformers/cuda/mem_eff_attention/
H A Dkernel_forward.h501 typename DefaultEpilogue::OutputTileIterator::ThreadMap,
505 typename DefaultEpilogue::OutputTileIterator::ThreadMap,
/aosp_15_r20/out/soong/.intermediates/prebuilts/sdk/current/androidx/m2repository/androidx/compose/runtime/runtime-android/1.8.0-beta01/androidx.compose.runtime_runtime/android_common_apex30/aar/
Dbaseline-prof.txt101 HSPLandroidx/compose/runtime/internal/ThreadMap;->**(**)**
Dclasses.jarMETA-INF/ androidx/ androidx/compose/ androidx/compose/runtime/ androidx/compose ...
/aosp_15_r20/out/soong/.intermediates/prebuilts/sdk/current/androidx/m2repository/androidx/compose/runtime/runtime-android/1.8.0-beta01/androidx.compose.runtime_runtime/android_common/aar/
Dbaseline-prof.txt101 HSPLandroidx/compose/runtime/internal/ThreadMap;->**(**)**
Dandroidx.compose.runtime_runtime.jarMETA-INF/ androidx/ androidx/compose/ androidx/compose/runtime/ androidx/compose ...
/aosp_15_r20/out/soong/.intermediates/prebuilts/sdk/current/androidx/m2repository/androidx/compose/runtime/runtime-android/1.8.0-beta01/androidx.compose.runtime_runtime/android_common_apex34/aar/
Dbaseline-prof.txt101 HSPLandroidx/compose/runtime/internal/ThreadMap;->**(**)**
Dclasses.jarMETA-INF/ androidx/ androidx/compose/ androidx/compose/runtime/ androidx/compose ...

1234