Coverage for src/flag_gems/runtime/backend/_arm/__init__.py: 0%
4 statements
« prev ^ index » next coverage.py v7.6.9, created at 2026-06-10 07:09 +0800
« prev ^ index » next coverage.py v7.6.9, created at 2026-06-10 07:09 +0800
1from backend_utils import VendorInfoBase # noqa: E402
# Vendor descriptor for this backend: vendor "arm" on the "cpu" device, with an
# empty device-query command.
vendor_info = VendorInfoBase(
    vendor_name="arm",
    device_name="cpu",
    device_query_cmd="",
)
# Ops listed here are excluded from the ARM customized registry.
#
# The leading 393 entries are auto-generated as
#   upstream _FULL_CONFIG (456 funcs) - _arm/ops/__all__ (63 funcs)
# and appear in sorted order.
# Principle: only register _arm impls we've validated to beat ATen native.
# All other entries from _FULL_CONFIG fall through to PyTorch ATen on ARM CPU.
#
# NOTE(review): the tuple holds 403 names, not 393. The last ten entries
# (see the marker near the end) sit outside the sorted run and are not covered
# by the 456 - 63 arithmetic above -- presumably appended by hand after
# generation. Confirm, then either fold them into the generator or document
# why they are excluded.
CUSTOMIZED_UNUSED_OPS = (
    "_assert_async",
    "_conv_depthwise2d",
    "_index_put_impl_",
    "_is_all_true",
    "_safe_softmax",
    "_unique2",
    "_upsample_bicubic2d_aa",
    "_upsample_bicubic2d_aa_backward",
    "_upsample_nearest_exact1d",
    "abs",
    "abs_",
    "absolute",
    "acos",
    "addcdiv",
    "addcdiv_out",
    "addcmul",
    "addcmul_out",
    "addmm_dtype",
    "addmm_dtype_out",
    "addmv",
    "addmv_out",
    "addr",
    "affine_grid_generator",
    "alias_copy",
    "all_dim",
    "all_dims",
    "allclose",
    "amax",
    "aminmax",
    "angle",
    "any_dim",
    "any_dims",
    "arange_start",
    "arcsinh",
    "arcsinh_",
    "arcsinh_out",
    "arctanh_",
    "argmin",
    "asinh",
    "asinh_",
    "asinh_out",
    "atan",
    "atan2",
    "atan2_out",
    "atan_",
    "avg_pool2d",
    "avg_pool2d_backward",
    "avg_pool3d",
    "avg_pool3d_backward",
    "baddbmm",
    "batch_norm",
    "batch_norm_backward",
    "bernoulli_",
    "bincount",
    "bitwise_and_scalar",
    "bitwise_and_scalar_",
    "bitwise_and_scalar_tensor",
    "bitwise_and_tensor",
    "bitwise_and_tensor_",
    "bitwise_left_shift",
    "bitwise_not",
    "bitwise_not_",
    "bitwise_or_scalar",
    "bitwise_or_scalar_",
    "bitwise_or_scalar_tensor",
    "bitwise_or_tensor",
    "bitwise_or_tensor_",
    "bitwise_right_shift",
    "bmm_out",
    "cat_out",
    "ceil",
    "ceil_",
    "ceil_out",
    "celu",
    "celu_",
    "clamp",
    "clamp_",
    "clamp_min",
    "clamp_min_",
    "clamp_tensor",
    "clamp_tensor_",
    "clip",
    "clip_",
    "col2im",
    "concatenate",
    "conj_physical",
    "constant_pad_nd",
    "conv1d",
    "conv2d",
    "conv3d",
    "conv_transpose1d",
    "copysign",
    "copysign_out",
    "cos_",
    "cosh",
    "cosh_",
    "cosh_out",
    "count_nonzero",
    "ctc_loss",
    "cudnn_convolution",
    "cummax",
    "cummin",
    "cumprod",
    "cumprod_",
    "cumsum_out",
    "diag",
    "diag_embed",
    "diagonal_backward",
    "diff",
    "digamma_",
    "dot",
    "dropout",
    "dropout_backward",
    "elu",
    "elu_",
    "elu_backward",
    "embedding_backward",
    "embedding_dense_backward",
    "eq",
    "eq_scalar",
    "equal",
    "erf",
    "erf_",
    "exp",
    "exp2",
    "exp2_",
    "exp_",
    "exp_out",
    "expm1",
    "expm1_",
    "expm1_out",
    "eye",
    "eye_m",
    "feature_dropout",
    "feature_dropout_",
    "fill_scalar",
    "fill_scalar_",
    "fill_scalar_out",
    "fill_tensor",
    "fill_tensor_",
    "fill_tensor_out",
    "flash_attention_forward",
    "flip",
    "floor_",
    "fmin",
    "fmin_out",
    "fmod_scalar",
    "fmod_scalar_",
    "fmod_tensor",
    "fmod_tensor_",
    "full_like",
    "gather_backward",
    "gcd",
    "gcd_out",
    "ge",
    "ge_scalar",
    "gelu_",
    "gelu_backward",
    "glu",
    "glu_backward",
    "greater",
    "greater_out",
    "greater_scalar",
    "greater_scalar_out",
    "grid_sample",
    "group_mm",
    "group_norm",
    "group_norm_backward",
    "gt",
    "gt_scalar",
    "hardsigmoid",
    "hardsigmoid_out",
    "hardswish_",
    "histc",
    "hstack",
    "hypot",
    "i0",
    "i0_",
    "i0_out",
    "index_add",
    "index_add_",
    "index_copy",
    "index_copy_",
    "index_put",
    "index_put_",
    "isclose",
    "isfinite",
    "isinf",
    "isnan",
    "isneginf",
    "isneginf_out",
    "kron",
    "layer_norm",
    "layer_norm_backward",
    "le",
    "le_scalar",
    "leaky_relu",
    "leaky_relu_",
    "leaky_relu_out",
    "lerp_scalar",
    "lerp_scalar_",
    "lerp_tensor",
    "lerp_tensor_",
    "lift_fresh_copy",
    "linspace",
    "log",
    "log10",
    "log10_",
    "log10_out",
    "log1p_",
    "log_sigmoid",
    "log_softmax_backward",
    "log_softmax_backward_out",
    "log_softmax_out",
    "logaddexp",
    "logaddexp_out",
    "logical_and",
    "logical_and_",
    "logical_not",
    "logical_or",
    "logical_or_",
    "logical_xor",
    "logit",
    "logit_",
    "logit_out",
    "logspace",
    "logsumexp",
    "lt_scalar",
    "margin_ranking_loss",
    "masked_fill_",
    "masked_scatter",
    "masked_scatter_",
    "masked_select",
    "max_dim",
    "max_pool2d_backward",
    "max_pool2d_with_indices",
    "max_pool3d_backward",
    "max_pool3d_with_indices",
    "maximum",
    "median",
    "median_dim",
    "median_dim_values",
    "median_out",
    "min_dim",
    "minimum",
    "mse_loss",
    "mv",
    "nan_to_num",
    "ne",
    "ne_scalar",
    "new_full",
    "nll_loss2d_backward",
    "nll_loss2d_forward",
    "nll_loss_backward",
    "nll_loss_forward",
    "nll_loss_nd_backward",
    "nll_loss_nd_forward",
    "nonzero",
    "nonzero_numpy",
    "normal_",
    "normal_float_tensor",
    "normal_tensor_float",
    "normal_tensor_tensor",
    "normed_cumsum",
    "one_hot",
    "pad",
    "pixel_shuffle",
    "pixel_unshuffle",
    "pixel_unshuffle_out",
    "poisson",
    "polar",
    "prelu",
    "prod",
    "prod_dim",
    "rand",
    "rand_like",
    "randn",
    "randn_like",
    "randperm",
    "reciprocal",
    "reciprocal_",
    "reflection_pad1d",
    "reflection_pad1d_out",
    "reflection_pad2d",
    "reflection_pad2d_out",
    "relu",
    "relu6",
    "relu_",
    "repeat",
    "repeat_interleave_self_int",
    "repeat_interleave_self_tensor",
    "repeat_interleave_tensor",
    "replication_pad1d",
    "replication_pad1d_out",
    "replication_pad3d",
    "resolve_conj",
    "resolve_neg",
    "rms_norm",
    "roll",
    "round",
    "round_",
    "round_out",
    "rrelu_with_noise_backward",
    "rsub_scalar",
    "rsub_tensor",
    "scaled_softmax_backward",
    "scaled_softmax_forward",
    "scatter_",
    "scatter_add_",
    "scatter_reduce",
    "scatter_reduce_",
    "scatter_reduce_out",
    "select_backward",
    "select_scatter",
    "selu",
    "selu_",
    "sgn_",
    "sigmoid",
    "sigmoid_",
    "sigmoid_backward",
    "signbit",
    "signbit_out",
    "silu_",
    "silu_backward",
    "sin_",
    "sinh_",
    "slice_backward",
    "slice_scatter",
    "smooth_l1_loss",
    "smooth_l1_loss_backward",
    "smooth_l1_loss_out",
    "soft_margin_loss",
    "softmax_backward",
    "softmax_backward_out",
    "softmax_out",
    "softplus",
    "softshrink",
    "softshrink_out",
    "sort_stable",
    "special_i0e",
    "special_i0e_out",
    "special_i1",
    "special_i1_out",
    "sqrt",
    "sqrt_",
    "square",
    "square_",
    "square_out",
    "stack",
    "std",
    "sub_",
    "sum_dim",
    "sum_dim_out",
    "sum_out",
    "svd",
    "t_copy",
    "t_copy_out",
    "tan",
    "tan_",
    "tanh",
    "tanh_",
    "tanh_backward",
    "threshold",
    "threshold_backward",
    "tile",
    "trace",
    "tril",
    "tril_",
    "tril_out",
    "triu",
    "triu_",
    "true_divide_out",
    "unfold_backward",
    "uniform_",
    "unique_consecutive",
    "upsample_bicubic2d",
    "upsample_linear1d",
    "upsample_nearest1d",
    "upsample_nearest2d",
    "upsample_nearest3d",
    "var",
    "var_correction",
    "var_dim",
    "var_mean",
    "vdot",
    "vector_norm",
    "vstack",
    "weight_norm_interface",
    "weight_norm_interface_backward",
    "where_self",
    "zero",
    "zero_",
    "zero_out",
    # --- End of the sorted, auto-generated run (393 names). ---
    # NOTE(review): the ten names below break the sort order; original order
    # is kept as-is so the tuple's contents are unchanged.
    "add",
    "add_",
    "copy_",
    "cat",
    "index",
    "ones_like",
    "mul",
    "to_copy",
    "mul_",
    "zeros_like",
)
# Public names of this module. "*" is not a wildcard inside __all__: a
# star-import looks up each listed string as an attribute, so ["*"] makes
# `from <this module> import *` raise AttributeError. List the names this
# module defines instead.
# NOTE(review): the imported VendorInfoBase is deliberately not re-exported;
# add it here if any caller relies on getting it through a star-import.
__all__ = ["vendor_info", "CUSTOMIZED_UNUSED_OPS"]