Coverage for src/flag_gems/runtime/backend/_arm/__init__.py: 0%
4 statements
« prev ^ index » next coverage.py v7.6.9, created at 2026-06-05 07:36 +0800
« prev ^ index » next coverage.py v7.6.9, created at 2026-06-05 07:36 +0800
1from backend_utils import VendorInfoBase # noqa: E402
3vendor_info = VendorInfoBase(
4 vendor_name="arm", device_name="cpu", device_query_cmd="cat /proc/cpuinfo"
5)
7# Ops listed here are excluded from the ARM customized registry.
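8# Auto-generated as a set difference: upstream _FULL_CONFIG (456 funcs) minus _arm/ops/__all__ (63 funcs) = 393 funcs; the unsorted trailing entries ("add" through "zeros_like") appear to be hand-appended (TODO confirm).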
9# Principle: only register _arm impls we've validated to beat ATen native.
10# All other entries from _FULL_CONFIG fall through to PyTorch ATen on ARM CPU.
11CUSTOMIZED_UNUSED_OPS = (
12 "_assert_async",
13 "_conv_depthwise2d",
14 "_index_put_impl_",
15 "_is_all_true",
16 "_safe_softmax",
17 "_unique2",
18 "_upsample_bicubic2d_aa",
19 "_upsample_bicubic2d_aa_backward",
20 "_upsample_nearest_exact1d",
21 "abs",
22 "abs_",
23 "absolute",
24 "acos",
25 "addcdiv",
26 "addcdiv_out",
27 "addcmul",
28 "addcmul_out",
29 "addmm_dtype",
30 "addmm_dtype_out",
31 "addmv",
32 "addmv_out",
33 "addr",
34 "affine_grid_generator",
35 "alias_copy",
36 "all_dim",
37 "all_dims",
38 "allclose",
39 "amax",
40 "aminmax",
41 "angle",
42 "any_dim",
43 "any_dims",
44 "arange_start",
45 "arcsinh",
46 "arcsinh_",
47 "arcsinh_out",
48 "arctanh_",
49 "argmin",
50 "asinh",
51 "asinh_",
52 "asinh_out",
53 "atan",
54 "atan2",
55 "atan2_out",
56 "atan_",
57 "avg_pool2d",
58 "avg_pool2d_backward",
59 "avg_pool3d",
60 "avg_pool3d_backward",
61 "baddbmm",
62 "batch_norm",
63 "batch_norm_backward",
64 "bernoulli_",
65 "bincount",
66 "bitwise_and_scalar",
67 "bitwise_and_scalar_",
68 "bitwise_and_scalar_tensor",
69 "bitwise_and_tensor",
70 "bitwise_and_tensor_",
71 "bitwise_left_shift",
72 "bitwise_not",
73 "bitwise_not_",
74 "bitwise_or_scalar",
75 "bitwise_or_scalar_",
76 "bitwise_or_scalar_tensor",
77 "bitwise_or_tensor",
78 "bitwise_or_tensor_",
79 "bitwise_right_shift",
80 "bmm_out",
81 "cat_out",
82 "ceil",
83 "ceil_",
84 "ceil_out",
85 "celu",
86 "celu_",
87 "clamp",
88 "clamp_",
89 "clamp_min",
90 "clamp_min_",
91 "clamp_tensor",
92 "clamp_tensor_",
93 "clip",
94 "clip_",
95 "col2im",
96 "concatenate",
97 "conj_physical",
98 "constant_pad_nd",
99 "conv1d",
100 "conv2d",
101 "conv3d",
102 "conv_transpose1d",
103 "copysign",
104 "copysign_out",
105 "cos_",
106 "cosh",
107 "cosh_",
108 "cosh_out",
109 "count_nonzero",
110 "ctc_loss",
111 "cudnn_convolution",
112 "cummax",
113 "cummin",
114 "cumprod",
115 "cumprod_",
116 "cumsum_out",
117 "diag",
118 "diag_embed",
119 "diagonal_backward",
120 "diff",
121 "digamma_",
122 "dot",
123 "dropout",
124 "dropout_backward",
125 "elu",
126 "elu_",
127 "elu_backward",
128 "embedding_backward",
129 "embedding_dense_backward",
130 "eq",
131 "eq_scalar",
132 "equal",
133 "erf",
134 "erf_",
135 "exp",
136 "exp2",
137 "exp2_",
138 "exp_",
139 "exp_out",
140 "expm1",
141 "expm1_",
142 "expm1_out",
143 "eye",
144 "eye_m",
145 "feature_dropout",
146 "feature_dropout_",
147 "fill_scalar",
148 "fill_scalar_",
149 "fill_scalar_out",
150 "fill_tensor",
151 "fill_tensor_",
152 "fill_tensor_out",
153 "flash_attention_forward",
154 "flip",
155 "floor_",
156 "fmin",
157 "fmin_out",
158 "fmod_scalar",
159 "fmod_scalar_",
160 "fmod_tensor",
161 "fmod_tensor_",
162 "full_like",
163 "gather_backward",
164 "gcd",
165 "gcd_out",
166 "ge",
167 "ge_scalar",
168 "gelu_",
169 "gelu_backward",
170 "glu",
171 "glu_backward",
172 "greater",
173 "greater_out",
174 "greater_scalar",
175 "greater_scalar_out",
176 "grid_sample",
177 "group_mm",
178 "group_norm",
179 "group_norm_backward",
180 "gt",
181 "gt_scalar",
182 "hardsigmoid",
183 "hardsigmoid_out",
184 "hardswish_",
185 "histc",
186 "hstack",
187 "hypot",
188 "i0",
189 "i0_",
190 "i0_out",
191 "index_add",
192 "index_add_",
193 "index_copy",
194 "index_copy_",
195 "index_put",
196 "index_put_",
197 "isclose",
198 "isfinite",
199 "isinf",
200 "isnan",
201 "isneginf",
202 "isneginf_out",
203 "kron",
204 "layer_norm",
205 "layer_norm_backward",
206 "le",
207 "le_scalar",
208 "leaky_relu",
209 "leaky_relu_",
210 "leaky_relu_out",
211 "lerp_scalar",
212 "lerp_scalar_",
213 "lerp_tensor",
214 "lerp_tensor_",
215 "lift_fresh_copy",
216 "linspace",
217 "log",
218 "log10",
219 "log10_",
220 "log10_out",
221 "log1p_",
222 "log_sigmoid",
223 "log_softmax_backward",
224 "log_softmax_backward_out",
225 "log_softmax_out",
226 "logaddexp",
227 "logaddexp_out",
228 "logical_and",
229 "logical_and_",
230 "logical_not",
231 "logical_or",
232 "logical_or_",
233 "logical_xor",
234 "logit",
235 "logit_",
236 "logit_out",
237 "logspace",
238 "logsumexp",
239 "lt_scalar",
240 "margin_ranking_loss",
241 "masked_fill_",
242 "masked_scatter",
243 "masked_scatter_",
244 "masked_select",
245 "max_dim",
246 "max_pool2d_backward",
247 "max_pool2d_with_indices",
248 "max_pool3d_backward",
249 "max_pool3d_with_indices",
250 "maximum",
251 "median",
252 "median_dim",
253 "median_dim_values",
254 "median_out",
255 "min_dim",
256 "minimum",
257 "mse_loss",
258 "mv",
259 "nan_to_num",
260 "ne",
261 "ne_scalar",
262 "new_full",
263 "nll_loss2d_backward",
264 "nll_loss2d_forward",
265 "nll_loss_backward",
266 "nll_loss_forward",
267 "nll_loss_nd_backward",
268 "nll_loss_nd_forward",
269 "nonzero",
270 "nonzero_numpy",
271 "normal_",
272 "normal_float_tensor",
273 "normal_tensor_float",
274 "normal_tensor_tensor",
275 "normed_cumsum",
276 "one_hot",
277 "pad",
278 "pixel_shuffle",
279 "pixel_unshuffle",
280 "pixel_unshuffle_out",
281 "poisson",
282 "polar",
283 "prelu",
284 "prod",
285 "prod_dim",
286 "rand",
287 "rand_like",
288 "randn",
289 "randn_like",
290 "randperm",
291 "reciprocal",
292 "reciprocal_",
293 "reflection_pad1d",
294 "reflection_pad1d_out",
295 "reflection_pad2d",
296 "reflection_pad2d_out",
297 "relu",
298 "relu6",
299 "relu_",
300 "repeat",
301 "repeat_interleave_self_int",
302 "repeat_interleave_self_tensor",
303 "repeat_interleave_tensor",
304 "replication_pad1d",
305 "replication_pad1d_out",
306 "replication_pad3d",
307 "resolve_conj",
308 "resolve_neg",
309 "rms_norm",
310 "roll",
311 "round",
312 "round_",
313 "round_out",
314 "rrelu_with_noise_backward",
315 "rsub_scalar",
316 "rsub_tensor",
317 "scaled_softmax_backward",
318 "scaled_softmax_forward",
319 "scatter_",
320 "scatter_add_",
321 "scatter_reduce",
322 "scatter_reduce_",
323 "scatter_reduce_out",
324 "select_backward",
325 "select_scatter",
326 "selu",
327 "selu_",
328 "sgn_",
329 "sigmoid",
330 "sigmoid_",
331 "sigmoid_backward",
332 "signbit",
333 "signbit_out",
334 "silu_",
335 "silu_backward",
336 "sin_",
337 "sinh_",
338 "slice_backward",
339 "slice_scatter",
340 "smooth_l1_loss",
341 "smooth_l1_loss_backward",
342 "smooth_l1_loss_out",
343 "soft_margin_loss",
344 "softmax_backward",
345 "softmax_backward_out",
346 "softmax_out",
347 "softplus",
348 "softshrink",
349 "softshrink_out",
350 "sort_stable",
351 "special_i0e",
352 "special_i0e_out",
353 "special_i1",
354 "special_i1_out",
355 "sqrt",
356 "sqrt_",
357 "square",
358 "square_",
359 "square_out",
360 "stack",
361 "std",
362 "sub_",
363 "sum_dim",
364 "sum_dim_out",
365 "sum_out",
366 "svd",
367 "t_copy",
368 "t_copy_out",
369 "tan",
370 "tan_",
371 "tanh",
372 "tanh_",
373 "tanh_backward",
374 "threshold",
375 "threshold_backward",
376 "tile",
377 "trace",
378 "tril",
379 "tril_",
380 "tril_out",
381 "triu",
382 "triu_",
383 "true_divide_out",
384 "unfold_backward",
385 "uniform_",
386 "unique_consecutive",
387 "upsample_bicubic2d",
388 "upsample_linear1d",
389 "upsample_nearest1d",
390 "upsample_nearest2d",
391 "upsample_nearest3d",
392 "var",
393 "var_correction",
394 "var_dim",
395 "var_mean",
396 "vdot",
397 "vector_norm",
398 "vstack",
399 "weight_norm_interface",
400 "weight_norm_interface_backward",
401 "where_self",
402 "zero",
403 "zero_",
404 "zero_out",
405 "add",
406 "add_",
407 "copy_",
408 "cat",
409 "index",
410 "ones_like",
411 "mul",
412 "to_copy",
413 "mul_",
414 "zeros_like",
415)
418__all__ = ["*"]