Home
last modified time | relevance | path

Searched defs:head_dim (Results 1 – 21 of 21) sorted by relevance

/aosp_15_r20/external/executorch/examples/mediatek/model_export_scripts/
H A Dllama.py165 num_chunks, num_key_value_heads, num_blocks_per_chunk, head_dim, max_cache_size argument
232 head_dim, argument
/aosp_15_r20/external/pytorch/benchmarks/gpt_fast/
H A Dmodel.py26 head_dim: int = 64 variable in ModelArgs
93 self, max_batch_size, max_seq_length, n_heads, head_dim, dtype=torch.bfloat16 argument
H A Dmixtral_moe_model.py26 head_dim: int = 64 variable in ModelArgs
72 self, max_batch_size, max_seq_length, n_heads, head_dim, dtype=torch.bfloat16 argument
/aosp_15_r20/external/pytorch/test/
H A Dtest_flop_counter.py323 head_dim, argument
480 head_dim, argument
H A Dtest_transformers.py1703 def _get_block_size_n(device, head_dim, is_dropout, is_causal): argument
1811 head_dim, argument
1894 head_dim, argument
3326 def rand_nt(sequence_list, num_heads, head_dim): argument
/aosp_15_r20/external/executorch/backends/vulkan/test/op_tests/
H A Dsdpa_test.cpp222 const int head_dim = embedding_dim / num_heads; in test_reference_sdpa() local
292 const int head_dim = embedding_dim / num_heads; in test_vulkan_sdpa() local
H A Drotary_embedding_test.cpp83 const int head_dim = dim / n_heads; in test_reference() local
/aosp_15_r20/external/executorch/examples/mediatek/models/llm_models/weights/Llama-3.2-1B-Instruct/
H A Dconfig.json7 "head_dim": 64, number
/aosp_15_r20/external/executorch/examples/mediatek/models/llm_models/weights/Llama-3.2-3B-Instruct/
H A Dconfig.json7 "head_dim": 128, number
/aosp_15_r20/external/pytorch/benchmarks/transformer/
H A Dsdpa.py40 def head_dim(self) -> int: member in ExperimentConfig
H A Dattention_bias_benchmarks.py39 def head_dim(self) -> int: member in ExperimentConfig
/aosp_15_r20/external/executorch/examples/models/llama/source_transformation/
H A Dquantized_kv_cache.py36 head_dim, argument
H A Dapply_spin_quant_r1_r2.py68 def rotate_ov_proj(layer, head_dim, R2=None): argument
/aosp_15_r20/external/pytorch/torch/csrc/api/include/torch/nn/modules/
H A Dactivation.h864 int64_t head_dim; variable
/aosp_15_r20/external/executorch/extension/llm/custom_ops/
H A Dtest_sdpa_with_kv_cache.py407 head_dim, argument
/aosp_15_r20/external/pytorch/torch/csrc/api/include/torch/nn/functional/
H A Dactivation.h677 const auto head_dim = embed_dim / num_heads; variable
/aosp_15_r20/external/pytorch/aten/src/ATen/native/nested/cuda/
H A DNestedTensorTransformerUtils.cpp174 const int64_t head_dim, in view_as_dense()
/aosp_15_r20/external/pytorch/aten/src/ATen/native/transformers/cuda/
H A Dsdp_utils.cpp316 const auto head_dim = params.query.sym_size(3); in check_cudnn_tensor_shapes() local
/aosp_15_r20/external/pytorch/aten/src/ATen/native/transformers/cuda/mem_eff_attention/
H A Dkernel_forward.h158 int32_t head_dim = 0; member
H A Dkernel_backward.h662 int32_t head_dim = -1; member
/aosp_15_r20/external/pytorch/test/inductor/
H A Dtest_aot_inductor.py1444 head_dim, argument