Coverage for src/flag_gems/ops/__init__.py: 100%
293 statements
« prev ^ index » next coverage.py v7.6.9, created at 2026-06-05 07:36 +0800
« prev ^ index » next coverage.py v7.6.9, created at 2026-06-05 07:36 +0800
1from flag_gems.ops._euclidean_dist import _euclidean_dist
2from flag_gems.ops._functional_sym_constrain_range_for_size import (
3 _functional_sym_constrain_range_for_size,
4)
5from flag_gems.ops._is_all_true import _is_all_true
6from flag_gems.ops._safe_softmax import _safe_softmax
7from flag_gems.ops._upsample_nearest_exact1d import _upsample_nearest_exact1d
8from flag_gems.ops.abs import abs, abs_
9from flag_gems.ops.absolute import absolute
10from flag_gems.ops.acos import acos
11from flag_gems.ops.act_quant import act_quant_triton
12from flag_gems.ops.add import add, add_
13from flag_gems.ops.addcdiv import addcdiv, addcdiv_out
14from flag_gems.ops.addcmul import addcmul, addcmul_out
15from flag_gems.ops.addmm import addmm, addmm_dtype, addmm_dtype_out, addmm_out
16from flag_gems.ops.addmv import addmv, addmv_out
17from flag_gems.ops.addr import addr
18from flag_gems.ops.affine_grid_generator import affine_grid_generator
19from flag_gems.ops.alias_copy import alias_copy, alias_copy_out
20from flag_gems.ops.all import all, all_dim, all_dims
21from flag_gems.ops.amax import amax
22from flag_gems.ops.aminmax import aminmax
23from flag_gems.ops.angle import angle
24from flag_gems.ops.any import any, any_dim, any_dims
25from flag_gems.ops.arange import arange, arange_start
26from flag_gems.ops.arcsinh import arcsinh, arcsinh_out
27from flag_gems.ops.arcsinh_ import arcsinh_
28from flag_gems.ops.arctanh_ import arctanh_
29from flag_gems.ops.argmax import argmax
30from flag_gems.ops.argmin import argmin
31from flag_gems.ops.argsort import argsort
32from flag_gems.ops.as_strided_copy import as_strided_copy, as_strided_copy_out
33from flag_gems.ops.asinh import asinh, asinh_out
34from flag_gems.ops.asinh_ import asinh_
35from flag_gems.ops.assert_async import _assert_async
36from flag_gems.ops.atan import atan, atan_
37from flag_gems.ops.atan2 import atan2, atan2_out
38from flag_gems.ops.attention import (
39 ScaleDotProductAttention,
40 flash_attention_forward,
41 flash_attn_varlen_func,
42 flash_attn_varlen_opt_func,
43 scaled_dot_product_attention,
44 scaled_dot_product_attention_backward,
45 scaled_dot_product_attention_forward,
46)
47from flag_gems.ops.avg_pool2d import avg_pool2d, avg_pool2d_backward
48from flag_gems.ops.avg_pool3d import avg_pool3d, avg_pool3d_backward
49from flag_gems.ops.baddbmm import baddbmm, baddbmm_out
50from flag_gems.ops.batch_norm import batch_norm, batch_norm_backward
51from flag_gems.ops.bernoulli_ import bernoulli_
52from flag_gems.ops.bincount import bincount
53from flag_gems.ops.bitwise_and import (
54 bitwise_and_scalar,
55 bitwise_and_scalar_,
56 bitwise_and_scalar_tensor,
57 bitwise_and_tensor,
58 bitwise_and_tensor_,
59)
60from flag_gems.ops.bitwise_left_shift import bitwise_left_shift
61from flag_gems.ops.bitwise_not import bitwise_not, bitwise_not_
62from flag_gems.ops.bitwise_or import (
63 bitwise_or_scalar,
64 bitwise_or_scalar_,
65 bitwise_or_scalar_tensor,
66 bitwise_or_tensor,
67 bitwise_or_tensor_,
68)
69from flag_gems.ops.bitwise_right_shift import bitwise_right_shift
70from flag_gems.ops.bmm import bmm, bmm_out
71from flag_gems.ops.cat import cat, cat_out
72from flag_gems.ops.cauchy import cauchy, cauchy_
73from flag_gems.ops.ceil import ceil, ceil_, ceil_out
74from flag_gems.ops.celu import celu, celu_
75from flag_gems.ops.clamp import (
76 clamp,
77 clamp_,
78 clamp_min,
79 clamp_min_,
80 clamp_tensor,
81 clamp_tensor_,
82)
83from flag_gems.ops.clamp_max import clamp_max, clamp_max_ # noqa: F401
84from flag_gems.ops.clip import clip, clip_
85from flag_gems.ops.col2im import col2im
86from flag_gems.ops.concatenate import concatenate
87from flag_gems.ops.conj_physical import conj_physical
88from flag_gems.ops.contiguous import contiguous
89from flag_gems.ops.conv1d import conv1d
90from flag_gems.ops.conv2d import conv2d
91from flag_gems.ops.conv3d import conv3d
92from flag_gems.ops.conv_depthwise2d import _conv_depthwise2d
93from flag_gems.ops.conv_transpose1d import conv_transpose1d
94from flag_gems.ops.conv_transpose2d import conv_transpose2d
95from flag_gems.ops.copy import copy, copy_
96from flag_gems.ops.copysign import copysign, copysign_out
97from flag_gems.ops.cos import cos, cos_
98from flag_gems.ops.cosh import cosh, cosh_, cosh_out
99from flag_gems.ops.count_nonzero import count_nonzero
100from flag_gems.ops.ctc_loss import ctc_loss
101from flag_gems.ops.cudnn_convolution import cudnn_convolution
102from flag_gems.ops.cummax import cummax
103from flag_gems.ops.cummin import cummin
104from flag_gems.ops.cumprod import cumprod, cumprod_
105from flag_gems.ops.cumsum import cumsum, cumsum_out, normed_cumsum
106from flag_gems.ops.diag import diag
107from flag_gems.ops.diag_embed import diag_embed
108from flag_gems.ops.diagonal import diagonal_backward
109from flag_gems.ops.diff import diff
110from flag_gems.ops.digamma_ import digamma_
111from flag_gems.ops.div import (
112 div_mode,
113 div_mode_,
114 floor_divide,
115 floor_divide_,
116 true_divide,
117 true_divide_,
118 true_divide_out,
119)
120from flag_gems.ops.dot import dot
121from flag_gems.ops.dropout import dropout, dropout_backward
122from flag_gems.ops.elu import elu, elu_, elu_backward
123from flag_gems.ops.embedding import embedding, embedding_backward
124from flag_gems.ops.embedding_dense_backward import embedding_dense_backward
125from flag_gems.ops.eq import eq, eq_scalar, equal
126from flag_gems.ops.erf import erf, erf_
127from flag_gems.ops.exp import exp, exp_, exp_out
128from flag_gems.ops.exp2 import exp2, exp2_
129from flag_gems.ops.expm1 import expm1, expm1_, expm1_out
130from flag_gems.ops.exponential_ import exponential_
131from flag_gems.ops.eye import eye
132from flag_gems.ops.eye_m import eye_m
133from flag_gems.ops.feature_dropout import feature_dropout, feature_dropout_
134from flag_gems.ops.fft import fft
135from flag_gems.ops.fill import (
136 fill_scalar,
137 fill_scalar_,
138 fill_scalar_out,
139 fill_tensor,
140 fill_tensor_,
141 fill_tensor_out,
142)
143from flag_gems.ops.flip import flip
144from flag_gems.ops.floor import floor, floor_out
145from flag_gems.ops.floor_ import floor_
146from flag_gems.ops.fmin import fmin, fmin_out
147from flag_gems.ops.fmod import fmod_scalar, fmod_scalar_, fmod_tensor, fmod_tensor_
148from flag_gems.ops.fp8_matmul import fp8_matmul
149from flag_gems.ops.fp8_mqa_logits import fp8_mqa_logits
150from flag_gems.ops.full import full
151from flag_gems.ops.full_like import full_like
152from flag_gems.ops.gather import gather, gather_backward
153from flag_gems.ops.gcd import gcd, gcd_out
154from flag_gems.ops.ge import ge, ge_scalar
155from flag_gems.ops.gelu import gelu, gelu_, gelu_backward
156from flag_gems.ops.get_paged_mqa_logits_metadata import get_paged_mqa_logits_metadata
157from flag_gems.ops.get_scheduler_metadata import get_scheduler_metadata
158from flag_gems.ops.glu import glu, glu_backward
159from flag_gems.ops.greater import (
160 greater,
161 greater_out,
162 greater_scalar,
163 greater_scalar_out,
164)
165from flag_gems.ops.grid_sample import grid_sample
166from flag_gems.ops.group_gemm import group_mm
167from flag_gems.ops.groupnorm import group_norm, group_norm_backward
168from flag_gems.ops.gt import gt, gt_scalar
169from flag_gems.ops.hadamard_transform import (
170 hadamard_transform,
171 hadamard_transform_12N,
172 hadamard_transform_20N,
173 hadamard_transform_28N,
174 hadamard_transform_40N,
175)
176from flag_gems.ops.hardsigmoid import hardsigmoid, hardsigmoid_out
177from flag_gems.ops.hardswish_ import hardswish_
178from flag_gems.ops.histc import histc
179from flag_gems.ops.hstack import hstack
180from flag_gems.ops.hypot import hypot, hypot_out
181from flag_gems.ops.i0 import i0, i0_out
182from flag_gems.ops.i0_ import i0_
183from flag_gems.ops.index import index
184from flag_gems.ops.index_add import index_add, index_add_
185from flag_gems.ops.index_copy_ import index_copy, index_copy_
186from flag_gems.ops.index_put import _index_put_impl_, index_put, index_put_
187from flag_gems.ops.index_select import index_select
188from flag_gems.ops.isclose import allclose, isclose
189from flag_gems.ops.isfinite import isfinite
190from flag_gems.ops.isin import isin
191from flag_gems.ops.isinf import isinf
192from flag_gems.ops.isnan import isnan
193from flag_gems.ops.isneginf import isneginf, isneginf_out
194from flag_gems.ops.kron import kron
195from flag_gems.ops.layernorm import layer_norm, layer_norm_backward
196from flag_gems.ops.le import le, le_scalar
197from flag_gems.ops.leaky_relu import leaky_relu, leaky_relu_, leaky_relu_out
198from flag_gems.ops.lerp import lerp_scalar, lerp_scalar_, lerp_tensor, lerp_tensor_
199from flag_gems.ops.lift_fresh_copy import lift_fresh_copy, lift_fresh_copy_out
200from flag_gems.ops.linspace import linspace
201from flag_gems.ops.log import log
202from flag_gems.ops.log1p import log1p
203from flag_gems.ops.log1p_ import log1p_
204from flag_gems.ops.log10 import log10, log10_, log10_out
205from flag_gems.ops.log_sigmoid import log_sigmoid
206from flag_gems.ops.log_softmax import (
207 log_softmax,
208 log_softmax_backward,
209 log_softmax_backward_out,
210 log_softmax_out,
211)
212from flag_gems.ops.logaddexp import logaddexp, logaddexp_out
213from flag_gems.ops.logical_and import logical_and, logical_and_
214from flag_gems.ops.logical_not import logical_not
215from flag_gems.ops.logical_or import logical_or, logical_or_
216from flag_gems.ops.logical_xor import logical_xor
217from flag_gems.ops.logit import logit, logit_out
218from flag_gems.ops.logit_ import logit_
219from flag_gems.ops.logspace import logspace
220from flag_gems.ops.logsumexp import logsumexp
221from flag_gems.ops.lt import lt, lt_scalar
222from flag_gems.ops.margin_ranking_loss import margin_ranking_loss
223from flag_gems.ops.masked_fill import masked_fill, masked_fill_
224from flag_gems.ops.masked_scatter import masked_scatter, masked_scatter_
225from flag_gems.ops.masked_select import masked_select
226from flag_gems.ops.max import max, max_dim
227from flag_gems.ops.max_pool2d_with_indices import (
228 max_pool2d_backward,
229 max_pool2d_with_indices,
230)
231from flag_gems.ops.max_pool3d_with_indices import (
232 max_pool3d_backward,
233 max_pool3d_with_indices,
234)
235from flag_gems.ops.maximum import maximum
236from flag_gems.ops.mean import mean, mean_dim
237from flag_gems.ops.median import median, median_dim, median_dim_values, median_out
238from flag_gems.ops.min import min, min_dim
239from flag_gems.ops.minimum import minimum
240from flag_gems.ops.mm import mm, mm_out, router_gemm
241from flag_gems.ops.mse_loss import mse_loss
242from flag_gems.ops.mul import mul, mul_
243from flag_gems.ops.multinomial import multinomial
244from flag_gems.ops.mv import mv
245from flag_gems.ops.nan_to_num import nan_to_num
246from flag_gems.ops.ne import ne, ne_scalar
247from flag_gems.ops.neg import neg, neg_
248from flag_gems.ops.new_full import new_full
249from flag_gems.ops.nll_loss_nd import nll_loss_nd_backward, nll_loss_nd_forward
250from flag_gems.ops.nllloss import (
251 nll_loss2d_backward,
252 nll_loss2d_forward,
253 nll_loss_backward,
254 nll_loss_forward,
255)
256from flag_gems.ops.nonzero import nonzero
257from flag_gems.ops.nonzero_numpy import nonzero_numpy
258from flag_gems.ops.normal import (
259 normal_,
260 normal_float_tensor,
261 normal_tensor_float,
262 normal_tensor_tensor,
263)
264from flag_gems.ops.one_hot import one_hot
265from flag_gems.ops.ones import ones
266from flag_gems.ops.ones_like import ones_like
267from flag_gems.ops.pad import constant_pad_nd, pad
268from flag_gems.ops.per_token_group_quant_fp8 import (
269 SUPPORTED_FP8_DTYPE,
270 per_token_group_quant_fp8,
271)
272from flag_gems.ops.pixel_shuffle import pixel_shuffle
273from flag_gems.ops.pixel_unshuffle import pixel_unshuffle, pixel_unshuffle_out
274from flag_gems.ops.poisson import poisson
275from flag_gems.ops.polar import polar
276from flag_gems.ops.pow import (
277 pow_scalar,
278 pow_tensor_scalar,
279 pow_tensor_scalar_,
280 pow_tensor_tensor,
281 pow_tensor_tensor_,
282)
283from flag_gems.ops.prelu import prelu
284from flag_gems.ops.prod import prod, prod_dim
285from flag_gems.ops.quantile import quantile
286from flag_gems.ops.rad2deg import rad2deg, rad2deg_
287from flag_gems.ops.rand import rand
288from flag_gems.ops.rand_like import rand_like
289from flag_gems.ops.randint import randint
290from flag_gems.ops.randint_like import randint_like
291from flag_gems.ops.randn import randn
292from flag_gems.ops.randn_like import randn_like
293from flag_gems.ops.randperm import randperm
294from flag_gems.ops.reciprocal import reciprocal, reciprocal_
295from flag_gems.ops.reflection_pad1d import reflection_pad1d, reflection_pad1d_out
296from flag_gems.ops.reflection_pad1d_backward import reflection_pad1d_backward
297from flag_gems.ops.reflection_pad2d import reflection_pad2d, reflection_pad2d_out
298from flag_gems.ops.relu import relu, relu_
299from flag_gems.ops.relu6 import relu6
300from flag_gems.ops.remainder import remainder, remainder_
301from flag_gems.ops.renorm import renorm, renorm_
302from flag_gems.ops.repeat import repeat
303from flag_gems.ops.repeat_interleave import (
304 repeat_interleave_self_int,
305 repeat_interleave_self_tensor,
306 repeat_interleave_tensor,
307)
308from flag_gems.ops.replication_pad1d import replication_pad1d, replication_pad1d_out
309from flag_gems.ops.replication_pad3d import replication_pad3d
310from flag_gems.ops.resolve_conj import resolve_conj
311from flag_gems.ops.resolve_neg import resolve_neg
312from flag_gems.ops.rms_norm import rms_norm, rms_norm_backward, rms_norm_forward
313from flag_gems.ops.roll import roll
314from flag_gems.ops.round import round, round_, round_out
315from flag_gems.ops.rrelu_with_noise_backward import rrelu_with_noise_backward
316from flag_gems.ops.rsqrt import rsqrt, rsqrt_
317from flag_gems.ops.rsub import rsub_scalar, rsub_tensor
318from flag_gems.ops.scaled_mm import scaled_mm, scaled_mm_out
319from flag_gems.ops.scaled_softmax import scaled_softmax_backward, scaled_softmax_forward
320from flag_gems.ops.scatter import scatter, scatter_
321from flag_gems.ops.scatter_add_ import scatter_add_
322from flag_gems.ops.scatter_reduce import (
323 scatter_reduce,
324 scatter_reduce_,
325 scatter_reduce_out,
326)
327from flag_gems.ops.select_backward import select_backward
328from flag_gems.ops.select_scatter import select_scatter
329from flag_gems.ops.selu import selu
330from flag_gems.ops.selu_ import selu_
331from flag_gems.ops.sgn_ import sgn_
332from flag_gems.ops.sigmoid import sigmoid, sigmoid_, sigmoid_backward
333from flag_gems.ops.signbit import signbit, signbit_out
334from flag_gems.ops.silu import silu, silu_, silu_backward
335from flag_gems.ops.sin import sin, sin_
336from flag_gems.ops.sinh_ import sinh_
337from flag_gems.ops.slice_backward import slice_backward
338from flag_gems.ops.slice_scatter import slice_scatter
339from flag_gems.ops.smooth_l1_loss import (
340 smooth_l1_loss,
341 smooth_l1_loss_backward,
342 smooth_l1_loss_out,
343)
344from flag_gems.ops.soft_margin_loss import soft_margin_loss, soft_margin_loss_out
345from flag_gems.ops.softmax import (
346 softmax,
347 softmax_backward,
348 softmax_backward_out,
349 softmax_out,
350)
351from flag_gems.ops.softplus import softplus
352from flag_gems.ops.softshrink import softshrink, softshrink_out
353from flag_gems.ops.sort import sort, sort_stable
354from flag_gems.ops.special_i0e import special_i0e, special_i0e_out
355from flag_gems.ops.special_i1 import special_i1, special_i1_out
356from flag_gems.ops.sqrt import sqrt, sqrt_
357from flag_gems.ops.square import square, square_, square_out
358from flag_gems.ops.stack import stack
359from flag_gems.ops.std import std
360from flag_gems.ops.sub import sub, sub_
361from flag_gems.ops.sum import sum, sum_dim, sum_dim_out, sum_out
362from flag_gems.ops.svd import svd
363from flag_gems.ops.t_copy import t_copy, t_copy_out
364from flag_gems.ops.tan import tan, tan_
365from flag_gems.ops.tanh import tanh, tanh_, tanh_backward
366from flag_gems.ops.threshold import threshold, threshold_backward
367from flag_gems.ops.tile import tile
368from flag_gems.ops.to import to_copy
369from flag_gems.ops.topk import topk
370from flag_gems.ops.trace import trace
371from flag_gems.ops.tril import tril, tril_, tril_out
372from flag_gems.ops.triu import triu, triu_
373from flag_gems.ops.unfold_backward import unfold_backward
374from flag_gems.ops.uniform import uniform_
375from flag_gems.ops.unique import _unique2
376from flag_gems.ops.unique_consecutive import unique_consecutive
377from flag_gems.ops.upsample_bicubic2d import upsample_bicubic2d
378from flag_gems.ops.upsample_bicubic2d_aa import _upsample_bicubic2d_aa
379from flag_gems.ops.upsample_bicubic2d_aa_backward import _upsample_bicubic2d_aa_backward
380from flag_gems.ops.upsample_linear1d import upsample_linear1d
381from flag_gems.ops.upsample_nearest1d import upsample_nearest1d
382from flag_gems.ops.upsample_nearest2d import upsample_nearest2d
383from flag_gems.ops.upsample_nearest3d import upsample_nearest3d
384from flag_gems.ops.var import var, var_correction, var_dim
385from flag_gems.ops.var_mean import var_mean
386from flag_gems.ops.vdot import vdot
387from flag_gems.ops.vector_norm import vector_norm
388from flag_gems.ops.vstack import vstack
389from flag_gems.ops.w8a8_block_fp8_matmul import w8a8_block_fp8_matmul
390from flag_gems.ops.weightnorm import (
391 weight_norm_interface,
392 weight_norm_interface_backward,
393)
394from flag_gems.ops.where import (
395 where_scalar_other,
396 where_scalar_self,
397 where_self,
398 where_self_out,
399)
400from flag_gems.ops.zero import zero, zero_out
401from flag_gems.ops.zeros import zero_, zeros
402from flag_gems.ops.zeros_like import zeros_like
404__all__ = [
405 "_assert_async",
406 "_conv_depthwise2d",
407 "_euclidean_dist",
408 "_functional_sym_constrain_range_for_size",
409 "_index_put_impl_",
410 "_is_all_true",
411 "_safe_softmax",
412 "_unique2",
413 "_upsample_bicubic2d_aa",
414 "_upsample_bicubic2d_aa_backward",
415 "_upsample_nearest_exact1d",
416 "abs",
417 "abs_",
418 "absolute",
419 "acos",
420 "act_quant_triton",
421 "add",
422 "add_",
423 "addcdiv",
424 "addcdiv_out",
425 "addcmul",
426 "addcmul_out",
427 "addmm",
428 "addmm_dtype",
429 "addmm_dtype_out",
430 "addmm_out",
431 "addmv",
432 "addmv_out",
433 "addr",
434 "affine_grid_generator",
435 "alias_copy",
436 "alias_copy_out",
437 "all",
438 "all_dim",
439 "all_dims",
440 "allclose",
441 "amax",
442 "aminmax",
443 "angle",
444 "any",
445 "any_dim",
446 "any_dims",
447 "arange",
448 "arange_start",
449 "arcsinh",
450 "arcsinh_",
451 "arcsinh_out",
452 "arctanh_",
453 "argmax",
454 "argmin",
455 "argsort",
456 "as_strided_copy",
457 "as_strided_copy_out",
458 "asinh",
459 "asinh_",
460 "asinh_out",
461 "atan",
462 "atan2",
463 "atan2_out",
464 "atan_",
465 "avg_pool2d",
466 "avg_pool2d_backward",
467 "avg_pool3d",
468 "avg_pool3d_backward",
469 "baddbmm",
470 "baddbmm_out",
471 "batch_norm",
472 "batch_norm_backward",
473 "bernoulli_",
474 "bincount",
475 "bitwise_and_scalar",
476 "bitwise_and_scalar_",
477 "bitwise_and_scalar_tensor",
478 "bitwise_and_tensor",
479 "bitwise_and_tensor_",
480 "bitwise_left_shift",
481 "bitwise_not",
482 "bitwise_not_",
483 "bitwise_or_scalar",
484 "bitwise_or_scalar_",
485 "bitwise_or_scalar_tensor",
486 "bitwise_or_tensor",
487 "bitwise_or_tensor_",
488 "bitwise_right_shift",
489 "bmm",
490 "bmm_out",
491 "cat",
492 "cat_out",
493 "cauchy",
494 "cauchy_",
495 "ceil",
496 "ceil_",
497 "ceil_out",
498 "celu",
499 "celu_",
500 "clamp",
501 "clamp_",
502 "clamp_max",
503 "clamp_max_",
504 "clamp_min",
505 "clamp_min_",
506 "clamp_tensor",
507 "clamp_tensor_",
508 "clip",
509 "clip_",
510 "col2im",
511 "concatenate",
512 "conj_physical",
513 "constant_pad_nd",
514 "contiguous",
515 "conv1d",
516 "conv2d",
517 "conv3d",
518 "conv_transpose1d",
519 "conv_transpose2d",
520 "copy",
521 "copy_",
522 "copysign",
523 "copysign_out",
524 "cos",
525 "cos_",
526 "cosh",
527 "cosh_",
528 "cosh_out",
529 "count_nonzero",
530 "ctc_loss",
531 "cudnn_convolution",
532 "cummax",
533 "cummin",
534 "cumprod",
535 "cumprod_",
536 "cumsum",
537 "cumsum_out",
538 "diag",
539 "diag_embed",
540 "diagonal_backward",
541 "diff",
542 "digamma_",
543 "div_mode",
544 "div_mode_",
545 "dot",
546 "dropout",
547 "dropout_backward",
548 "elu",
549 "elu_",
550 "elu_backward",
551 "embedding",
552 "embedding_backward",
553 "embedding_dense_backward",
554 "eq",
555 "eq_scalar",
556 "equal",
557 "erf",
558 "erf_",
559 "exp",
560 "exp2",
561 "exp2_",
562 "exp_",
563 "exp_out",
564 "expm1",
565 "expm1_",
566 "expm1_out",
567 "exponential_",
568 "eye",
569 "eye_m",
570 "feature_dropout",
571 "feature_dropout_",
572 "fft",
573 "fill_scalar",
574 "fill_scalar_",
575 "fill_scalar_out",
576 "fill_tensor",
577 "fill_tensor_",
578 "fill_tensor_out",
579 "flash_attention_forward",
580 "flash_attn_varlen_func",
581 "flash_attn_varlen_opt_func",
582 "flip",
583 "floor",
584 "floor_",
585 "floor_out",
586 "floor_divide",
587 "floor_divide_",
588 "fmin",
589 "fmin_out",
590 "fmod_scalar",
591 "fmod_scalar_",
592 "fmod_tensor",
593 "fmod_tensor_",
594 "fp8_matmul",
595 "fp8_mqa_logits",
596 "full",
597 "full_like",
598 "gather",
599 "gather_backward",
600 "gcd",
601 "gcd_out",
602 "ge",
603 "ge_scalar",
604 "gelu",
605 "gelu_",
606 "gelu_backward",
607 "get_paged_mqa_logits_metadata",
608 "get_scheduler_metadata",
609 "glu",
610 "glu_backward",
611 "greater",
612 "greater_out",
613 "greater_scalar",
614 "greater_scalar_out",
615 "grid_sample",
616 "group_mm",
617 "group_norm",
618 "group_norm_backward",
619 "gt",
620 "gt_scalar",
621 "hadamard_transform",
622 "hadamard_transform_12N",
623 "hadamard_transform_20N",
624 "hadamard_transform_28N",
625 "hadamard_transform_40N",
626 "hardsigmoid",
627 "hardsigmoid_out",
628 "hardswish_",
629 "histc",
630 "hstack",
631 "hypot",
632 "hypot_out",
633 "i0",
634 "i0_",
635 "i0_out",
636 "index",
637 "index_add",
638 "index_add_",
639 "index_copy",
640 "index_copy_",
641 "index_put",
642 "index_put_",
643 "index_select",
644 "isclose",
645 "isfinite",
646 "isin",
647 "isinf",
648 "isnan",
649 "isneginf",
650 "isneginf_out",
651 "kron",
652 "layer_norm",
653 "layer_norm_backward",
654 "le",
655 "le_scalar",
656 "leaky_relu",
657 "leaky_relu_",
658 "leaky_relu_out",
659 "lerp_scalar",
660 "lerp_scalar_",
661 "lerp_tensor",
662 "lerp_tensor_",
663 "lift_fresh_copy",
664 "lift_fresh_copy_out",
665 "linspace",
666 "log",
667 "log10",
668 "log10_",
669 "log10_out",
670 "log1p_",
671 "log_sigmoid",
672 "log_softmax",
673 "log_softmax_backward",
674 "log_softmax_backward_out",
675 "log_softmax_out",
676 "log1p",
677 "log1p_",
678 "logaddexp",
679 "logaddexp_out",
680 "logical_and",
681 "logical_and_",
682 "logical_not",
683 "logical_or",
684 "logical_or_",
685 "logical_xor",
686 "logit",
687 "logit_",
688 "logit_out",
689 "logspace",
690 "logsumexp",
691 "lt",
692 "lt_scalar",
693 "margin_ranking_loss",
694 "masked_fill",
695 "masked_fill_",
696 "masked_scatter",
697 "masked_scatter_",
698 "masked_select",
699 "max",
700 "max_dim",
701 "max_pool2d_backward",
702 "max_pool2d_with_indices",
703 "max_pool3d_backward",
704 "max_pool3d_with_indices",
705 "maximum",
706 "mean",
707 "mean_dim",
708 "median",
709 "median_dim",
710 "median_dim_values",
711 "median_out",
712 "min",
713 "min_dim",
714 "minimum",
715 "mm",
716 "mm_out",
717 "mse_loss",
718 "mul",
719 "mul_",
720 "multinomial",
721 "mv",
722 "nan_to_num",
723 "ne",
724 "ne_scalar",
725 "neg",
726 "neg_",
727 "new_full",
728 "nll_loss2d_backward",
729 "nll_loss2d_forward",
730 "nll_loss_backward",
731 "nll_loss_forward",
732 "nll_loss_nd_backward",
733 "nll_loss_nd_forward",
734 "nonzero",
735 "nonzero_numpy",
736 "normal_",
737 "normal_float_tensor",
738 "normal_tensor_float",
739 "normal_tensor_tensor",
740 "normed_cumsum",
741 "one_hot",
742 "ones",
743 "ones_like",
744 "pad",
745 "per_token_group_quant_fp8",
746 "pixel_shuffle",
747 "pixel_unshuffle",
748 "pixel_unshuffle_out",
749 "poisson",
750 "polar",
751 "pow_scalar",
752 "pow_tensor_scalar",
753 "pow_tensor_scalar_",
754 "pow_tensor_tensor",
755 "pow_tensor_tensor_",
756 "prelu",
757 "prod",
758 "prod_dim",
759 "quantile",
760 "rad2deg",
761 "rad2deg_",
762 "rand",
763 "rand_like",
764 "randint",
765 "randint_like",
766 "randn",
767 "randn_like",
768 "randperm",
769 "reciprocal",
770 "reciprocal_",
771 "reflection_pad1d",
772 "reflection_pad1d_backward",
773 "reflection_pad1d_out",
774 "reflection_pad2d",
775 "reflection_pad2d_out",
776 "relu",
777 "relu6",
778 "relu_",
779 "remainder",
780 "remainder_",
781 "renorm",
782 "renorm_",
783 "repeat",
784 "repeat_interleave_self_int",
785 "repeat_interleave_self_tensor",
786 "repeat_interleave_tensor",
787 "replication_pad1d",
788 "replication_pad1d_out",
789 "replication_pad3d",
790 "resolve_conj",
791 "resolve_neg",
792 "rms_norm",
793 "rms_norm_backward",
794 "rms_norm_forward",
795 "roll",
796 "round",
797 "round_",
798 "round_out",
799 "router_gemm",
800 "rrelu_with_noise_backward",
801 "rsqrt",
802 "rsqrt_",
803 "rsub_scalar",
804 "rsub_tensor",
805 "scaled_dot_product_attention",
806 "scaled_dot_product_attention_backward",
807 "scaled_dot_product_attention_forward",
808 "scaled_mm",
809 "scaled_mm_out",
810 "scaled_softmax_backward",
811 "scaled_softmax_forward",
812 "ScaleDotProductAttention",
813 "scatter",
814 "scatter_",
815 "scatter_add_",
816 "scatter_reduce",
817 "scatter_reduce_",
818 "scatter_reduce_out",
819 "select_backward",
820 "select_scatter",
821 "selu",
822 "selu_",
823 "sgn_",
824 "sigmoid",
825 "sigmoid_",
826 "sigmoid_backward",
827 "signbit",
828 "signbit_out",
829 "silu",
830 "silu_",
831 "silu_backward",
832 "sin",
833 "sin_",
834 "sinh_",
835 "slice_backward",
836 "slice_scatter",
837 "smooth_l1_loss",
838 "smooth_l1_loss_backward",
839 "smooth_l1_loss_out",
840 "soft_margin_loss",
841 "soft_margin_loss_out",
842 "softmax",
843 "softmax_backward",
844 "softmax_backward_out",
845 "softmax_out",
846 "softplus",
847 "softshrink",
848 "softshrink_out",
849 "sort",
850 "sort_stable",
851 "special_i0e",
852 "special_i0e_out",
853 "special_i1",
854 "special_i1_out",
855 "sqrt",
856 "sqrt_",
857 "square",
858 "square_",
859 "square_out",
860 "stack",
861 "std",
862 "sub",
863 "sub_",
864 "sum",
865 "sum_dim",
866 "sum_dim_out",
867 "sum_out",
868 "SUPPORTED_FP8_DTYPE",
869 "svd",
870 "t_copy",
871 "t_copy_out",
872 "tan",
873 "tan_",
874 "tanh",
875 "tanh_",
876 "tanh_backward",
877 "threshold",
878 "threshold_backward",
879 "tile",
880 "to_copy",
881 "topk",
882 "trace",
883 "tril",
884 "tril_",
885 "tril_out",
886 "triu",
887 "triu_",
888 "true_divide",
889 "true_divide_",
890 "true_divide_out",
891 "unfold_backward",
892 "uniform_",
893 "unique_consecutive",
894 "upsample_bicubic2d",
895 "upsample_linear1d",
896 "upsample_nearest1d",
897 "upsample_nearest2d",
898 "upsample_nearest3d",
899 "var",
900 "var_correction",
901 "var_dim",
902 "var_mean",
903 "vdot",
904 "vector_norm",
905 "vstack",
906 "w8a8_block_fp8_matmul",
907 "weight_norm_interface",
908 "weight_norm_interface_backward",
909 "where_scalar_other",
910 "where_scalar_self",
911 "where_self",
912 "where_self_out",
913 "zero",
914 "zero_",
915 "zero_out",
916 "zeros",
917 "zeros_like",
918]