xref: /aosp_15_r20/external/executorch/kernels/quantized/quantized.yaml (revision 523fa7a60841cd1ecfb9cc4201f1ca8b03ed023a)
# Declares the schema quantized_decomposed::add.out and binds it to the kernel
# torch::executor::quantized_add_out.
# The schema takes two tensors (a, b), each followed by its own scale,
# zero_point, quant_min and quant_max arguments, then a third set prefixed
# out_*. `out` is keyword-only (after `*`) and annotated (a!), the same
# annotation carried by the return value.
# arg_meta is null, i.e. no argument metadata is given for this kernel binding.
1*523fa7a6SAndroid Build Coastguard Worker- func: quantized_decomposed::add.out(Tensor a, float a_scale, int a_zero_point, int a_quant_min, int a_quant_max, Tensor b, float b_scale, int b_zero_point, int b_quant_min, int b_quant_max, float out_scale, int out_zero_point, int out_quant_min, int out_quant_max, *, Tensor(a!) out) -> Tensor(a!)
2*523fa7a6SAndroid Build Coastguard Worker  variants: function
3*523fa7a6SAndroid Build Coastguard Worker  kernels:
4*523fa7a6SAndroid Build Coastguard Worker    - arg_meta: null
5*523fa7a6SAndroid Build Coastguard Worker      kernel_name: torch::executor::quantized_add_out
6*523fa7a6SAndroid Build Coastguard Worker
# Declares the schema quantized_decomposed::choose_qparams.Tensor_out and binds
# it to the kernel torch::executor::choose_qparams_tensor_out.
# Positional arguments: input tensor, quant_min, quant_max, eps and a
# ScalarType dtype. There are two keyword-only output tensors, scale_out (a!)
# and zero_point_out (b!); the return is a tuple carrying the same two
# annotations in that order.
7*523fa7a6SAndroid Build Coastguard Worker- func: quantized_decomposed::choose_qparams.Tensor_out(Tensor input, int quant_min, int quant_max, float eps, ScalarType dtype, *, Tensor(a!) scale_out, Tensor(b!) zero_point_out) -> (Tensor(a!), Tensor(b!))
8*523fa7a6SAndroid Build Coastguard Worker  variants: function
9*523fa7a6SAndroid Build Coastguard Worker  kernels:
10*523fa7a6SAndroid Build Coastguard Worker    - arg_meta: null
11*523fa7a6SAndroid Build Coastguard Worker      kernel_name: torch::executor::choose_qparams_tensor_out
12*523fa7a6SAndroid Build Coastguard Worker
# Declares the schema quantized_decomposed::dequantize_per_tensor.out and binds
# it to the kernel torch::executor::dequantize_per_tensor_out.
# In this overload scale is a float and zero_point an int (the .Tensor_out
# overload of the same op takes them as Tensors instead).
# out_dtype is an optional keyword-only ScalarType defaulting to None; `out`
# is keyword-only and annotated (a!), matching the return annotation.
13*523fa7a6SAndroid Build Coastguard Worker- func: quantized_decomposed::dequantize_per_tensor.out(Tensor input, float scale, int zero_point, int quant_min, int quant_max, ScalarType dtype, *, ScalarType? out_dtype=None, Tensor(a!) out) -> Tensor(a!)
14*523fa7a6SAndroid Build Coastguard Worker  variants: function
15*523fa7a6SAndroid Build Coastguard Worker  kernels:
16*523fa7a6SAndroid Build Coastguard Worker    - arg_meta: null
17*523fa7a6SAndroid Build Coastguard Worker      kernel_name: torch::executor::dequantize_per_tensor_out
18*523fa7a6SAndroid Build Coastguard Worker
# Declares the schema quantized_decomposed::dequantize_per_tensor.Tensor_out
# and binds it to the kernel
# torch::executor::dequantize_per_tensor_tensor_args_out.
# Same argument list as dequantize_per_tensor.out except that scale and
# zero_point are passed as Tensors rather than float/int.
# out_dtype is an optional keyword-only ScalarType defaulting to None; `out`
# is keyword-only and annotated (a!), matching the return annotation.
19*523fa7a6SAndroid Build Coastguard Worker- func: quantized_decomposed::dequantize_per_tensor.Tensor_out(Tensor input, Tensor scale, Tensor zero_point, int quant_min, int quant_max, ScalarType dtype, *, ScalarType? out_dtype=None, Tensor(a!) out) -> Tensor(a!)
20*523fa7a6SAndroid Build Coastguard Worker  variants: function
21*523fa7a6SAndroid Build Coastguard Worker  kernels:
22*523fa7a6SAndroid Build Coastguard Worker    - arg_meta: null
23*523fa7a6SAndroid Build Coastguard Worker      kernel_name: torch::executor::dequantize_per_tensor_tensor_args_out
24*523fa7a6SAndroid Build Coastguard Worker
# Declares the schema quantized_decomposed::quantize_per_channel.out and binds
# it to the kernel torch::executor::quantize_per_channel_out.
# scales and zero_points are both required Tensors here, and an int `axis`
# argument is passed alongside quant_min, quant_max and the ScalarType dtype.
# `out` is keyword-only and annotated (a!), matching the return annotation.
25*523fa7a6SAndroid Build Coastguard Worker- func: quantized_decomposed::quantize_per_channel.out(Tensor input, Tensor scales, Tensor zero_points, int axis, int quant_min, int quant_max, ScalarType dtype, *, Tensor(a!) out) -> Tensor(a!)
26*523fa7a6SAndroid Build Coastguard Worker  variants: function
27*523fa7a6SAndroid Build Coastguard Worker  kernels:
28*523fa7a6SAndroid Build Coastguard Worker    - arg_meta: null
29*523fa7a6SAndroid Build Coastguard Worker      kernel_name: torch::executor::quantize_per_channel_out
30*523fa7a6SAndroid Build Coastguard Worker
# Declares the schema quantized_decomposed::dequantize_per_channel.out and
# binds it to the kernel torch::executor::dequantize_per_channel_out.
# zero_points is an optional Tensor (`Tensor?`) in this schema, whereas
# quantize_per_channel.out declares it as a required Tensor.
# out_dtype is an optional keyword-only ScalarType defaulting to None; `out`
# is keyword-only and annotated (a!), matching the return annotation.
31*523fa7a6SAndroid Build Coastguard Worker- func: quantized_decomposed::dequantize_per_channel.out(Tensor input, Tensor scales, Tensor? zero_points, int axis, int quant_min, int quant_max, ScalarType dtype, *, ScalarType? out_dtype=None, Tensor(a!) out) -> Tensor(a!)
32*523fa7a6SAndroid Build Coastguard Worker  variants: function
33*523fa7a6SAndroid Build Coastguard Worker  kernels:
34*523fa7a6SAndroid Build Coastguard Worker    - arg_meta: null
35*523fa7a6SAndroid Build Coastguard Worker      kernel_name: torch::executor::dequantize_per_channel_out
36*523fa7a6SAndroid Build Coastguard Worker
# Declares the schema quantized_decomposed::embedding_byte.out and binds it to
# the kernel torch::executor::quantized_embedding_byte_out.
# Arguments: weight, weight_scales, an optional weight_zero_points tensor,
# weight_quant_min / weight_quant_max ints, and an indices tensor.
# This overload has no dtype argument (see embedding_byte.dtype_out for that).
# `out` is keyword-only and annotated (a!), matching the return annotation.
37*523fa7a6SAndroid Build Coastguard Worker- func: quantized_decomposed::embedding_byte.out(Tensor weight, Tensor weight_scales, Tensor? weight_zero_points, int weight_quant_min, int weight_quant_max, Tensor indices, *, Tensor(a!) out) -> Tensor(a!)
38*523fa7a6SAndroid Build Coastguard Worker  variants: function
39*523fa7a6SAndroid Build Coastguard Worker  kernels:
40*523fa7a6SAndroid Build Coastguard Worker    - arg_meta: null
41*523fa7a6SAndroid Build Coastguard Worker      kernel_name: torch::executor::quantized_embedding_byte_out
42*523fa7a6SAndroid Build Coastguard Worker
# Declares the schema quantized_decomposed::embedding_byte.dtype_out and binds
# it to the kernel torch::executor::quantized_embedding_byte_dtype_out.
# Same positional arguments as embedding_byte.out, plus an optional
# ScalarType `dtype` (default None) that is keyword-only because it follows
# the `*` marker.
# `out` is keyword-only and annotated (a!), matching the return annotation.
43*523fa7a6SAndroid Build Coastguard Worker- func: quantized_decomposed::embedding_byte.dtype_out(Tensor weight, Tensor weight_scales, Tensor? weight_zero_points, int weight_quant_min, int weight_quant_max, Tensor indices, *, ScalarType? dtype=None, Tensor(a!) out) -> Tensor(a!)
44*523fa7a6SAndroid Build Coastguard Worker  variants: function
45*523fa7a6SAndroid Build Coastguard Worker  kernels:
46*523fa7a6SAndroid Build Coastguard Worker    - arg_meta: null
47*523fa7a6SAndroid Build Coastguard Worker      kernel_name: torch::executor::quantized_embedding_byte_dtype_out
48*523fa7a6SAndroid Build Coastguard Worker
# Declares the schema quantized_decomposed::embedding_2bit.out and binds it to
# the kernel torch::executor::quantized_embedding_2bit_out.
# The argument list is identical to embedding_byte.out: weight, weight_scales,
# optional weight_zero_points, weight_quant_min / weight_quant_max, indices.
# `out` is keyword-only and annotated (a!), matching the return annotation.
49*523fa7a6SAndroid Build Coastguard Worker- func: quantized_decomposed::embedding_2bit.out(Tensor weight, Tensor weight_scales, Tensor? weight_zero_points, int weight_quant_min, int weight_quant_max, Tensor indices, *, Tensor(a!) out) -> Tensor(a!)
50*523fa7a6SAndroid Build Coastguard Worker  variants: function
51*523fa7a6SAndroid Build Coastguard Worker  kernels:
52*523fa7a6SAndroid Build Coastguard Worker    - arg_meta: null
53*523fa7a6SAndroid Build Coastguard Worker      kernel_name: torch::executor::quantized_embedding_2bit_out
54*523fa7a6SAndroid Build Coastguard Worker
# Declares the schema quantized_decomposed::embedding_2bit.dtype_out and binds
# it to the kernel torch::executor::quantized_embedding_2bit_dtype_out.
# Same arguments as embedding_2bit.out plus an optional ScalarType `dtype`
# (default None).
# NOTE(review): `dtype` is placed BEFORE the `*` marker here, so it is a
# positional argument, whereas embedding_byte.dtype_out declares it after `*`
# (keyword-only). Presumably this mirrors the operator definition registered
# elsewhere; confirm against that definition before reordering.
# `out` is keyword-only and annotated (a!), matching the return annotation.
55*523fa7a6SAndroid Build Coastguard Worker- func: quantized_decomposed::embedding_2bit.dtype_out(Tensor weight, Tensor weight_scales, Tensor? weight_zero_points, int weight_quant_min, int weight_quant_max, Tensor indices, ScalarType? dtype=None, *, Tensor(a!) out) -> Tensor(a!)
56*523fa7a6SAndroid Build Coastguard Worker  variants: function
57*523fa7a6SAndroid Build Coastguard Worker  kernels:
58*523fa7a6SAndroid Build Coastguard Worker    - arg_meta: null
59*523fa7a6SAndroid Build Coastguard Worker      kernel_name: torch::executor::quantized_embedding_2bit_dtype_out
60*523fa7a6SAndroid Build Coastguard Worker
# Declares the schema quantized_decomposed::embedding_4bit.out and binds it to
# the kernel torch::executor::quantized_embedding_4bit_out.
# The argument list is identical to embedding_byte.out: weight, weight_scales,
# optional weight_zero_points, weight_quant_min / weight_quant_max, indices.
# `out` is keyword-only and annotated (a!), matching the return annotation.
61*523fa7a6SAndroid Build Coastguard Worker- func: quantized_decomposed::embedding_4bit.out(Tensor weight, Tensor weight_scales, Tensor? weight_zero_points, int weight_quant_min, int weight_quant_max, Tensor indices, *, Tensor(a!) out) -> Tensor(a!)
62*523fa7a6SAndroid Build Coastguard Worker  variants: function
63*523fa7a6SAndroid Build Coastguard Worker  kernels:
64*523fa7a6SAndroid Build Coastguard Worker    - arg_meta: null
65*523fa7a6SAndroid Build Coastguard Worker      kernel_name: torch::executor::quantized_embedding_4bit_out
66*523fa7a6SAndroid Build Coastguard Worker
# Declares the schema quantized_decomposed::embedding_4bit.dtype_out and binds
# it to the kernel torch::executor::quantized_embedding_4bit_dtype_out.
# Same arguments as embedding_4bit.out plus an optional ScalarType `dtype`
# (default None).
# NOTE(review): `dtype` is placed BEFORE the `*` marker here, so it is a
# positional argument, whereas embedding_byte.dtype_out declares it after `*`
# (keyword-only). Presumably this mirrors the operator definition registered
# elsewhere; confirm against that definition before reordering.
# `out` is keyword-only and annotated (a!), matching the return annotation.
67*523fa7a6SAndroid Build Coastguard Worker- func: quantized_decomposed::embedding_4bit.dtype_out(Tensor weight, Tensor weight_scales, Tensor? weight_zero_points, int weight_quant_min, int weight_quant_max, Tensor indices, ScalarType? dtype=None, *, Tensor(a!) out) -> Tensor(a!)
68*523fa7a6SAndroid Build Coastguard Worker  variants: function
69*523fa7a6SAndroid Build Coastguard Worker  kernels:
70*523fa7a6SAndroid Build Coastguard Worker    - arg_meta: null
71*523fa7a6SAndroid Build Coastguard Worker      kernel_name: torch::executor::quantized_embedding_4bit_dtype_out
72*523fa7a6SAndroid Build Coastguard Worker
# Declares the schema quantized_decomposed::mixed_mm.out and binds it to the
# kernel torch::executor::quantized_mixed_mm_out.
# Arguments: input, weight, weight_scales and an optional weight_zero_points
# tensor. Unlike mixed_linear.out, this schema has no dtype argument.
# `out` is keyword-only and annotated (a!), matching the return annotation.
73*523fa7a6SAndroid Build Coastguard Worker- func: quantized_decomposed::mixed_mm.out(Tensor input, Tensor weight, Tensor weight_scales, Tensor? weight_zero_points, *, Tensor(a!) out) -> Tensor(a!)
74*523fa7a6SAndroid Build Coastguard Worker  variants: function
75*523fa7a6SAndroid Build Coastguard Worker  kernels:
76*523fa7a6SAndroid Build Coastguard Worker    - arg_meta: null
77*523fa7a6SAndroid Build Coastguard Worker      kernel_name: torch::executor::quantized_mixed_mm_out
78*523fa7a6SAndroid Build Coastguard Worker
# Declares the schema quantized_decomposed::mixed_linear.out and binds it to
# the kernel torch::executor::quantized_mixed_linear_out.
# Arguments: input, weight, weight_scales, an optional weight_zero_points
# tensor, and an optional ScalarType `dtype` (default None).
# NOTE(review): `dtype` precedes the `*` marker, so it is positional rather
# than keyword-only; confirm this matches the operator definition registered
# elsewhere before changing it.
# `out` is keyword-only and annotated (a!), matching the return annotation.
79*523fa7a6SAndroid Build Coastguard Worker- func: quantized_decomposed::mixed_linear.out(Tensor input, Tensor weight, Tensor weight_scales, Tensor? weight_zero_points, ScalarType? dtype=None, *, Tensor(a!) out) -> Tensor(a!)
80*523fa7a6SAndroid Build Coastguard Worker  variants: function
81*523fa7a6SAndroid Build Coastguard Worker  kernels:
82*523fa7a6SAndroid Build Coastguard Worker    - arg_meta: null
83*523fa7a6SAndroid Build Coastguard Worker      kernel_name: torch::executor::quantized_mixed_linear_out
84*523fa7a6SAndroid Build Coastguard Worker
# Declares the schema quantized_decomposed::quantize_per_tensor.out and binds
# it to the kernel torch::executor::quantize_per_tensor_out.
# In this overload scale is a float and zero_point an int (the .Tensor_out
# overload of the same op takes them as Tensors instead).
# `out` is keyword-only and annotated (a!), matching the return annotation.
85*523fa7a6SAndroid Build Coastguard Worker- func: quantized_decomposed::quantize_per_tensor.out(Tensor input, float scale, int zero_point, int quant_min, int quant_max, ScalarType dtype, *, Tensor(a!) out) -> Tensor(a!)
86*523fa7a6SAndroid Build Coastguard Worker  variants: function
87*523fa7a6SAndroid Build Coastguard Worker  kernels:
88*523fa7a6SAndroid Build Coastguard Worker    - arg_meta: null
89*523fa7a6SAndroid Build Coastguard Worker      kernel_name: torch::executor::quantize_per_tensor_out
90*523fa7a6SAndroid Build Coastguard Worker
# Declares the schema quantized_decomposed::quantize_per_tensor.Tensor_out and
# binds it to the kernel torch::executor::quantize_per_tensor_tensor_args_out.
# Same argument list as quantize_per_tensor.out except that scale and
# zero_point are passed as Tensors rather than float/int.
# `out` is keyword-only and annotated (a!), matching the return annotation.
91*523fa7a6SAndroid Build Coastguard Worker- func: quantized_decomposed::quantize_per_tensor.Tensor_out(Tensor input, Tensor scale, Tensor zero_point, int quant_min, int quant_max, ScalarType dtype, *, Tensor(a!) out) -> Tensor(a!)
92*523fa7a6SAndroid Build Coastguard Worker  variants: function
93*523fa7a6SAndroid Build Coastguard Worker  kernels:
94*523fa7a6SAndroid Build Coastguard Worker    - arg_meta: null
95*523fa7a6SAndroid Build Coastguard Worker      kernel_name: torch::executor::quantize_per_tensor_tensor_args_out
96*523fa7a6SAndroid Build Coastguard Worker
# Declares the schema quantized_decomposed::choose_qparams_per_token_asymmetric.out
# and binds it to the kernel
# torch::executor::choose_qparams_per_token_asymmetric_out.
# Only an input tensor and a ScalarType dtype are passed positionally; unlike
# choose_qparams.Tensor_out there are no quant_min / quant_max / eps arguments.
# There are two keyword-only output tensors, scale_out (a!) and
# zero_point_out (b!); the return is a tuple carrying the same two
# annotations in that order.
97*523fa7a6SAndroid Build Coastguard Worker- func: quantized_decomposed::choose_qparams_per_token_asymmetric.out(Tensor input, ScalarType dtype, *, Tensor(a!) scale_out, Tensor(b!) zero_point_out) -> (Tensor(a!), Tensor(b!))
98*523fa7a6SAndroid Build Coastguard Worker  variants: function
99*523fa7a6SAndroid Build Coastguard Worker  kernels:
100*523fa7a6SAndroid Build Coastguard Worker    - arg_meta: null
101*523fa7a6SAndroid Build Coastguard Worker      kernel_name: torch::executor::choose_qparams_per_token_asymmetric_out
102*523fa7a6SAndroid Build Coastguard Worker
# Declares the schema quantized_decomposed::quantize_per_token.out and binds it
# to the kernel torch::executor::quantize_per_token_out.
# scales and zero_points are both required Tensors; quant_min, quant_max and
# the ScalarType dtype follow. There is no axis argument in this schema.
# `out` is keyword-only and annotated (a!), matching the return annotation.
103*523fa7a6SAndroid Build Coastguard Worker- func: quantized_decomposed::quantize_per_token.out(Tensor input, Tensor scales, Tensor zero_points, int quant_min, int quant_max, ScalarType dtype, *, Tensor(a!) out) -> Tensor(a!)
104*523fa7a6SAndroid Build Coastguard Worker  variants: function
105*523fa7a6SAndroid Build Coastguard Worker  kernels:
106*523fa7a6SAndroid Build Coastguard Worker    - arg_meta: null
107*523fa7a6SAndroid Build Coastguard Worker      kernel_name: torch::executor::quantize_per_token_out
108*523fa7a6SAndroid Build Coastguard Worker
# Declares the schema quantized_decomposed::dequantize_per_token.out and binds
# it to the kernel torch::executor::dequantize_per_token_out.
# scales and zero_points are both required Tensors.
# NOTE(review): the output type is given by a REQUIRED positional ScalarType
# named `output_dtype`, whereas the dequantize_per_tensor / dequantize_per_channel
# schemas in this file use an optional keyword-only `out_dtype=None`.
# Presumably this mirrors the operator definition registered elsewhere;
# confirm before harmonizing the names.
# `out` is keyword-only and annotated (a!), matching the return annotation.
109*523fa7a6SAndroid Build Coastguard Worker- func: quantized_decomposed::dequantize_per_token.out(Tensor input, Tensor scales, Tensor zero_points, int quant_min, int quant_max, ScalarType dtype, ScalarType output_dtype, *, Tensor(a!) out) -> Tensor(a!)
110*523fa7a6SAndroid Build Coastguard Worker  variants: function
111*523fa7a6SAndroid Build Coastguard Worker  kernels:
112*523fa7a6SAndroid Build Coastguard Worker    - arg_meta: null
113*523fa7a6SAndroid Build Coastguard Worker      kernel_name: torch::executor::dequantize_per_token_out
114