/aosp_15_r20/frameworks/native/opengl/libs/EGL/ |
H A D | BlobCache_test.cpp | 8 ** http://www.apache.org/licenses/LICENSE-2.0 34 BAD_VALUE = -EINVAL, 52 ASSERT_EQ(BlobCache::InsertResult::kInserted, mBC->set("abcd", 4, "efgh", 4)); in TEST_F() 53 ASSERT_EQ(size_t(4), mBC->get("abcd", 4, buf, 4)); in TEST_F() 62 ASSERT_EQ(BlobCache::InsertResult::kInserted, mBC->set("ab", 2, "cd", 2)); in TEST_F() 63 ASSERT_EQ(BlobCache::InsertResult::kInserted, mBC->set("ef", 2, "gh", 2)); in TEST_F() 64 ASSERT_EQ(size_t(2), mBC->get("ab", 2, buf, 2)); in TEST_F() 67 ASSERT_EQ(size_t(2), mBC->get("ef", 2, buf, 2)); in TEST_F() 74 ASSERT_EQ(BlobCache::InsertResult::kInserted, mBC->set("abcd", 4, "efgh", 4)); in TEST_F() 75 ASSERT_EQ(size_t(4), mBC->get("abcd", 4, buf + 1, 4)); in TEST_F() [all …]
|
/aosp_15_r20/packages/modules/NeuralNetworks/driver/cache/BlobCache/ |
D | BlobCache_test.cpp | 8 ** http://www.apache.org/licenses/LICENSE-2.0 36 enum { OK = 0, BAD_VALUE = -EINVAL }; 67 mBC->set("abcd", 4, "efgh", 4); in TEST_P() 68 ASSERT_EQ(size_t(4), mBC->get("abcd", 4, buf, 4)); in TEST_P() 77 mBC->set("ab", 2, "cd", 2); in TEST_P() 78 mBC->set("ef", 2, "gh", 2); in TEST_P() 79 ASSERT_EQ(size_t(2), mBC->get("ab", 2, buf, 2)); in TEST_P() 82 ASSERT_EQ(size_t(2), mBC->get("ef", 2, buf, 2)); in TEST_P() 89 mBC->set("ab", 2, "cd", 2); in TEST_P() 90 mBC->set("ef", 2, "gh", 2); in TEST_P() [all …]
|
/aosp_15_r20/external/arm-neon-tests/ |
H A D | Init.s | 4 ; Cortex-A8 Dhrystone example - Startup Code 26 ; Disable Cortex-A8 MMU if enabled 51 MCR p15, 0, r0, c8, c7, 0 ; Cortex-A8 I-TLB and D-TLB invalidation 54 ; Cache Invalidation code for Cortex-A8 57 ; Invalidate L1 Instruction Cache 60 TST r0, #0x3 ; Harvard Cache? 62 MCRNE p15, 0, r0, c7, c5, 0 ; Invalidate Instruction Cache 68 MOV r3, r3, LSR #23 ; Total cache levels << 1 71 MOV r10, #0 ; R10 holds current cache level << 1 72 Loop1 ADD r2, r10, r10, LSR #1 ; R2 holds cache "Set" position [all …]
|
/aosp_15_r20/external/mesa3d/src/amd/compiler/ |
H A D | README-ISA.md | 8 D.u = abs(S0.i - S1.i) + S2.u. 15 ABS_DIFF (A,B) = (A>B) ? (A-B) : (B-A) 21 `v_sad_u32(-5, 0, 0)` would return `4294967291` (`-5` interpreted as unsigned), 78 > and sent to the texture cache. Any texture or buffer resources and samplers 79 > are also sent immediately. However, write-data is not immediately sent to the 80 > texture cache. 102 ## FLAT, Scratch, Global instructions 118 GFX7-8 ISA manuals are mistaken about the available LDS size. 138 ## RDNA L0, L1 cache and DLC, GLC bits 140 The old L1 cache was renamed to L0, and a new L1 cache was added to RDNA. The [all …]
|
H A D | aco_assembler.cpp | 4 * SPDX-License-Identifier: MIT 38 : program(program_), gfx_level(program->gfx_level), symbols(symbols_) in asm_context() 52 int subvector_begin_pos = -1; 58 unsigned addr_dwords = instr->operands.size() - 3; in get_mimg_nsa_dwords() 60 if (instr->operands[3 + i].physReg() != in get_mimg_nsa_dwords() 61 instr->operands[3 + (i - 1)].physReg().advance(instr->operands[3 + (i - 1)].bytes())) in get_mimg_nsa_dwords() 62 return DIV_ROUND_UP(addr_dwords - 1, 4); in get_mimg_nsa_dwords() 70 switch (instr->opcode) { in get_vopd_opy_start() 112 uint8_t mask = get_gfx11_true16_mask(instr->opcode); in needs_vop3_gfx11() 117 if (instr->operands[i].physReg().reg() >= (256 + 128)) in needs_vop3_gfx11() [all …]
|
H A D | aco_print_ir.cpp | 4 * SPDX-License-Identifier: MIT 113 fprintf(output, "-%d]", r + size - 1); in print_physReg() 126 fprintf(output, "%d", reg - 128); in print_constant() 129 fprintf(output, "%d", 192 - reg); in print_constant() 135 case 241: fprintf(output, "-0.5"); break; in print_constant() 137 case 243: fprintf(output, "-1.0"); break; in print_constant() 139 case 245: fprintf(output, "-2.0"); break; in print_constant() 141 case 247: fprintf(output, "-4.0"); break; in print_constant() 150 print_reg_class(definition->regClass(), output); in print_definition() 151 if (definition->isPrecise()) in print_definition() [all …]
|
/aosp_15_r20/external/mesa3d/src/amd/common/ |
H A D | amd_kernel_code_t.h | 4 * SPDX-License-Identifier: MIT 10 //---------------------------------------------------------------------------// 12 //---------------------------------------------------------------------------// 48 ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_PRIVATE_SEGMENT_BUFFER_WIDTH) - 1) 54 ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_DISPATCH_PTR_WIDTH) - 1) 60 ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_QUEUE_PTR_WIDTH) - 1) 66 ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_KERNARG_SEGMENT_PTR_WIDTH) - 1) 72 ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_DISPATCH_ID_WIDTH) - 1) 78 ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_FLAT_SCRATCH_INIT_WIDTH) - 1) 84 ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_PRIVATE_SEGMENT_SIZE_WIDTH) - 1) [all …]
|
/aosp_15_r20/external/tensorflow/tensorflow/core/kernels/ |
H A D | deep_conv2d.cc | 7 http://www.apache.org/licenses/LICENSE-2.0 57 // Element-wise products (each product is a MatMul across depth). in GetDeepConvCost() 66 const int64_t row_tiles = (out_rows + out_tile_rows - 1) / out_tile_rows; in GetDeepConvCost() 67 const int64_t col_tiles = (out_cols + out_tile_cols - 1) / out_tile_cols; in GetDeepConvCost() 208 const int64_t base_filter_rows = transform->filter_shape().rows; in operator ()() 209 const int64_t base_filter_cols = transform->filter_shape().cols; in operator ()() 212 const int64_t tile_rows = transform->input_shape().rows; in operator ()() 213 const int64_t tile_cols = transform->input_shape().cols; in operator ()() 266 // 'filter_in' into 'filter_buf', adding zero-padding as needed. 294 const int64_t num_filters = od_limit - od_start; in operator ()() [all …]
|
/aosp_15_r20/external/tensorflow/tensorflow/core/kernels/mkl/ |
H A D | mkl_conv_ops.cc | 7 http://www.apache.org/licenses/LICENSE-2.0 100 return context_.fwd_pd->scratchpad_desc(); in GetScratchPadDesc() 121 // When we are using single global cache then in this case we can have in Execute() 127 // TODO(intel-tf): Create a common function and avoid the duplicate code in Execute() 128 context_.src_mem->set_data_handle( in Execute() 130 context_.filter_mem->set_data_handle( in Execute() 133 context_.bias_mem->set_data_handle( in Execute() 137 context_.bn_scale_mem->set_data_handle( in Execute() 139 context_.bn_mean_mem->set_data_handle( in Execute() 141 context_.bn_rsqrt_mem->set_data_handle( in Execute() [all …]
|
H A D | mkl_qmatmul_op.cc | 7 http://www.apache.org/licenses/LICENSE-2.0 16 // Implements a quantized eight-bit version of the matmul operation with bias, 19 // - Input: quantized as uint8 via either MIN_FIRST or SCALE mode. 20 // SCALE mode is selected when input is guaranteed to be non- 23 // - Weight: quantized to int8 via SCALE mode. 24 // - Bias: float32/int32. For int32, it is quantized according to input and 25 // filter min-max values. 35 // With SCALE quantization (used for non-negative Af32), Qa and Au8 can be 40 // Q'a = 255.0 / (Max(Af32) - Min(Af32)) 41 // A'u8 = round(Q'a * (Af32 - Min(Af32) * ones(Af32))), [all …]
|
/aosp_15_r20/out/soong/ |
D | build.aosp_shiba.4.ninja | 2 # Module: artd-aidl-rust 3 # Variant: android_arm64_armv8-2a_cortex-a55_source 9 m.artd-aidl-rust_android_arm64_armv8-2a_cortex-a55_source.moduleDesc = //art/artd/binder:artd-aidl-… 10 m.artd-aidl-rust_android_arm64_armv8-2a_cortex-a55_source.moduleDescSuffix = 13 …out/soong/.intermediates/art/artd/binder/artd-aidl-rust/android_arm64_armv8-2a_cortex-a55_source/a… 15 …out/soong/.intermediates/art/artd/binder/artd-aidl-rust-source/gen/com/android/server/art/ArtConst… 16 …out/soong/.intermediates/art/artd/binder/artd-aidl-rust-source/gen/com/android/server/art/ArtdDexo… 17 …out/soong/.intermediates/art/artd/binder/artd-aidl-rust-source/gen/com/android/server/art/Artifact… 18 …out/soong/.intermediates/art/artd/binder/artd-aidl-rust-source/gen/com/android/server/art/Artifact… 19 …out/soong/.intermediates/art/artd/binder/artd-aidl-rust-source/gen/com/android/server/art/CopyAndR… [all …]
|
/aosp_15_r20/external/swiftshader/third_party/llvm-10.0/llvm/lib/Target/AMDGPU/ |
H A D | AMDKernelCodeT.h | 1 //===-- AMDGPUKernelCodeT.h - Print AMDGPU assembly code ---------*- C++ -*-===// 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 7 //===----------------------------------------------------------------------===// 9 //===----------------------------------------------------------------------===// 20 //---------------------------------------------------------------------------// 22 //---------------------------------------------------------------------------// 91 …BUFFER = ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_PRIVATE_SEGMENT_BUFFER_WIDTH) - 1) << AMD_CODE_PROPE… 95 …GPR_DISPATCH_PTR = ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_DISPATCH_PTR_WIDTH) - 1) << AMD_CODE_PROPE… 99 …AMD_CODE_PROPERTY_ENABLE_SGPR_QUEUE_PTR = ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_QUEUE_PTR_WIDTH) - … 103 …GMENT_PTR = ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_KERNARG_SEGMENT_PTR_WIDTH) - 1) << AMD_CODE_PROPE… [all …]
|
/aosp_15_r20/external/swiftshader/third_party/llvm-16.0/llvm/lib/Target/AMDGPU/ |
H A D | AMDKernelCodeT.h | 1 //===-- AMDGPUKernelCodeT.h - Print AMDGPU assembly code ---------*- C++ -*-===// 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 7 //===----------------------------------------------------------------------===// 9 //===----------------------------------------------------------------------===// 16 //---------------------------------------------------------------------------// 18 //---------------------------------------------------------------------------// 87 …BUFFER = ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_PRIVATE_SEGMENT_BUFFER_WIDTH) - 1) << AMD_CODE_PROPE… 91 …GPR_DISPATCH_PTR = ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_DISPATCH_PTR_WIDTH) - 1) << AMD_CODE_PROPE… 95 …AMD_CODE_PROPERTY_ENABLE_SGPR_QUEUE_PTR = ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_QUEUE_PTR_WIDTH) - … 99 …GMENT_PTR = ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_KERNARG_SEGMENT_PTR_WIDTH) - 1) << AMD_CODE_PROPE… [all …]
|
H A D | SIInstrFormats.td | 1 //===-- SIInstrFormats.td - SI Instruction Encodings ----------------------===// 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 7 //===----------------------------------------------------------------------===// 11 //===----------------------------------------------------------------------===// 16 // Low bits - basic encoding information. 44 field bit FLAT = 0; 57 // High bits - other information. 70 // Most sopk treat the immediate as a signed 16-bit, however some 74 // This is an s_store_dword* instruction that requires a cache flush 76 // SMEM instructions like the cache flush ones. [all …]
|
/aosp_15_r20/external/llvm/lib/Target/AMDGPU/ |
H A D | AMDKernelCodeT.h | 1 //===-- AMDGPUKernelCodeT.h - Print AMDGPU assembly code ---------*- C++ -*-===// 8 //===----------------------------------------------------------------------===// 10 //===----------------------------------------------------------------------===// 21 //---------------------------------------------------------------------------// 23 //---------------------------------------------------------------------------// 92 …BUFFER = ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_PRIVATE_SEGMENT_BUFFER_WIDTH) - 1) << AMD_CODE_PROPE… 96 …GPR_DISPATCH_PTR = ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_DISPATCH_PTR_WIDTH) - 1) << AMD_CODE_PROPE… 100 …AMD_CODE_PROPERTY_ENABLE_SGPR_QUEUE_PTR = ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_QUEUE_PTR_WIDTH) - … 104 …GMENT_PTR = ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_KERNARG_SEGMENT_PTR_WIDTH) - 1) << AMD_CODE_PROPE… 108 …_SGPR_DISPATCH_ID = ((1 << AMD_CODE_PROPERTY_ENABLE_SGPR_DISPATCH_ID_WIDTH) - 1) << AMD_CODE_PROPE… [all …]
|
/aosp_15_r20/external/tensorflow/tensorflow/core/util/ |
H A D | mkl_util.h | 7 http://www.apache.org/licenses/LICENSE-2.0 152 // distinguish between blocked and non-blocked formats, we have defined a new 155 // 1) FORMAT_BLOCKED: as described above, this is needed for element-wise 157 // 2) FORMAT_INVALID: for error-checking (ex. unsupported format) 160 // FORMAT_X - 1D tensor 161 // FORMAT_NC - 2D tensor 162 // FORMAT_TNC - 3D tensor 264 #define INVALID_DIM_SIZE -1 270 data_.sizes_[i] = -1; 273 data_.map_[i] = -1; [all …]
|
/aosp_15_r20/external/tensorflow/tensorflow/lite/kernels/internal/ |
H A D | types.h | 7 http://www.apache.org/licenses/LICENSE-2.0 61 // This enumeration allows for non-default formats for the weights array 62 // of a fully-connected operator, allowing the use of special optimized 65 // Default format (flat 2D layout, the inner contiguous dimension 66 // is input_depth, the outer non-contiguous dimension is output_depth) 70 // 8-bit quantized layers. 72 // The use case we're concerned with here is: 8-bit quantization, 73 // large weights matrix that doesn't fit in cache (e.g. 4096x2048 in 74 // a key application that drove this), very small batch size (e.g. 1 -- 4). 76 // Even with 8-bit quantization of weights, the performance of memory [all …]
|
/aosp_15_r20/external/mesa3d/src/amd/compiler/tests/ |
H A D | test_assembler.cpp | 4 * SPDX-License-Identifier: MIT 6 #include <llvm/Config/llvm-config.h> 29 //~gfx[6-7]>> c7800000 30 //~gfx[6-7]! bf810000 31 //~gfx[8-9]>> s_memtime s[0:1] ; c0900000 00000000 51 bld.reset(program->create_and_insert_block()); 53 program->blocks[1].linear_preds.push_back(0u); 70 bld.reset(program->create_and_insert_block()); 79 bld.reset(program->create_and_insert_block()); 81 program->blocks[2].linear_preds.push_back(0u); [all …]
|
/aosp_15_r20/external/tensorflow/tensorflow/python/eager/ |
H A D | function.py | 7 # http://www.apache.org/licenses/LICENSE-2.0 15 # pylint: disable=unidiomatic-typecheck 16 """Defun decorator for defining graph-mode functions.""" 74 # tf.function->autograph->->dataset->tf.function). 104 return x._type_spec # pylint: disable=protected-access 196 next_func = g._get_function(func_tag.name) # pylint: disable=protected-access 201 exc._message = error_interpolation.interpolate(message, g) # pylint: disable=protected-access 216 - `function`: _EagerDefinedFunction being created before finalizing the graph. 218 - `name`: name of the function. 219 - `graph`: Graph of the function. [all …]
|
/aosp_15_r20/prebuilts/gcc/linux-x86/host/x86_64-w64-mingw32-4.8/share/man/man1/ |
D | x86_64-w64-mingw32-gprof.1 | 18 .\" Set up some character translations and predefined strings. \*(-- will 24 .tr \(*W- 27 . ds -- \(*W- 29 . if (\n(.H=4u)&(1m=24u) .ds -- \(*W\h'-12u'\(*W\h'-12u'-\" diablo 10 pitch 30 . if (\n(.H=4u)&(1m=20u) .ds -- \(*W\h'-12u'\(*W\h'-8u'-\" diablo 12 pitch 37 . ds -- \|\(em\| 73 .\" Fear. Run. Save yourself. No user-serviceable parts. 83 . ds #H ((1u-(\\\\n(.fu%2u))*.13m) 99 . ds ' \\k:\h'-(\\n(.wu*8/10-\*(#H)'\'\h"|\\n:u" 100 . ds ` \\k:\h'-(\\n(.wu*8/10-\*(#H)'\`\h'|\\n:u' [all …]
|
/aosp_15_r20/external/mesa3d/docs/drivers/ |
H A D | asahi.rst | 7 ----------------- 12 reverse-engineering the hardware, as glue to get at the "interesting" GPU 15 The library is only built if ``-Dtools=asahi`` is passed. It builds a single 24 ----------------- 36 ``st_var`` instruction. ``st_var`` takes a *vertex output index* and a 32-bit 39 consist of a single 32-bit value or an aligned 16-bit register pair, depending 40 on whether interpolation should happen at 32-bit or 16-bit. Vertex outputs are 42 32-bit user varyings coming next with perspective, flat, and linear interpolated 43 varyings grouped in that order, then 16-bit user varyings with the same groupings, 51 .. list-table:: Ordering of vertex outputs with all outputs used [all …]
|
/aosp_15_r20/external/tensorflow/tensorflow/compiler/tf2tensorrt/kernels/ |
H A D | trt_engine_op.cc | 7 http://www.apache.org/licenses/LICENSE-2.0 66 LOG_FIRST_N(WARNING, 5) << "TF-TRT Warning: " 80 device_memory_allocator_->free(device_memory_); in ~ContextDeviceMemory() 92 device_memory_ = device_memory_allocator_->allocate( in AllocateDeviceMemory() 103 execution_context_->setDeviceMemory(device_memory_); in AllocateDeviceMemory() 192 // engine fails, enters a dummy entry into the cache_resource cache so we 255 // user-provided quantization ranges. 280 return (void*)X->flat<EnumToDataType<dt>::Type>().data(); \ 284 auto tensor_type = tensor_ptr->dtype(); in GetTensorAddress() 301 flib_runtime->GetFunctionLibraryDefinition(); in FunctionDefToGraphDef() [all …]
|
/aosp_15_r20/external/tensorflow/tensorflow/dtensor/cc/ |
H A D | dtensor_tpu_kernels.cc | 7 http://www.apache.org/licenses/LICENSE-2.0 57 Status status = resource_manager->Delete<ResourceT>( in DeleteIfExists() 58 resource_manager->default_container(), resource_name); in DeleteIfExists() 89 OP_REQUIRES_OK(ctx, tpu_system->Initialize(ctx, rmgr, retry_timeout, in Compute() 105 ctx->allocate_output( in Compute() 109 ctx_output->flat<int32>()(i) = core_id_output_vec[i]; in Compute() 133 // Create the subgraph compilation cache and put it in the local resource in InitializeInternal() 150 while (!tpu_platform->Initialized() && in InitializeInternal() 151 (absl::Now() - start < retry_timeout)) { in InitializeInternal() 153 init_status = tpu_platform->Initialize({}); in InitializeInternal() [all …]
|
/aosp_15_r20/prebuilts/go/linux-x86/src/cmd/vendor/github.com/google/pprof/internal/report/ |
D | source.go | 7 // http://www.apache.org/licenses/LICENSE-2.0 108 fmt.Fprintf(w, "%10s %10s (flat, cum) %s of Total\n", 118 …fmt.Fprintf(w, "%10s %10s %6d:%s\n", valueOrDot(fn.Flat, rpt), valueOrDot(fn.Cum, rpt), fn.Info.Li… 145 loc *profile.Location // Always non-nil 154 file string // For top-level function in which instruction occurs 155 line int // For top-level function in which instruction occurs 156 flat, cum int64 // Samples to report (divisor already applied) member 163 flat int64 member 171 stack []callID // Inlined call-stack 179 flat, cum int64 member [all …]
|
/aosp_15_r20/external/tensorflow/tensorflow/compiler/jit/kernels/ |
H A D | xla_ops.cc | 7 http://www.apache.org/licenses/LICENSE-2.0 57 (CTX)->CtxFailureWithWarning(__FILE__, __LINE__, _s); \ 133 XlaExecutableClosure value = std::move(it->second); in Consume() 153 return ctx->op_device_context() ? ctx->op_device_context()->stream() in GetStream() 161 int device_ordinal = stream ? stream->parent()->device_ordinal() in GetLaunchContext() 162 : client->default_device_ordinal(); in GetLaunchContext() 178 auto start_time = env->NowMicros(); in RunExecutable() 183 run_options.set_intra_op_thread_pool(&ctx->eigen_cpu_device()); in RunExecutable() 190 executable->Run(std::move(execution_inputs), run_options); in RunExecutable() 193 executable->RunAsync(std::move(execution_inputs), run_options); in RunExecutable() [all …]
|