Coverage for src/flag_gems/ops/__init__.py: 100%
291 statements
coverage.py v7.6.9, created at 2026-06-04 09:03 +0800
1from flag_gems.ops._euclidean_dist import _euclidean_dist
2from flag_gems.ops._functional_sym_constrain_range_for_size import (
3 _functional_sym_constrain_range_for_size,
4)
5from flag_gems.ops._is_all_true import _is_all_true
6from flag_gems.ops._safe_softmax import _safe_softmax
7from flag_gems.ops._upsample_nearest_exact1d import _upsample_nearest_exact1d
8from flag_gems.ops.abs import abs, abs_
9from flag_gems.ops.absolute import absolute
10from flag_gems.ops.acos import acos
11from flag_gems.ops.act_quant import act_quant_triton
12from flag_gems.ops.add import add, add_
13from flag_gems.ops.addcdiv import addcdiv, addcdiv_out
14from flag_gems.ops.addcmul import addcmul, addcmul_out
15from flag_gems.ops.addmm import addmm, addmm_dtype, addmm_dtype_out, addmm_out
16from flag_gems.ops.addmv import addmv, addmv_out
17from flag_gems.ops.addr import addr
18from flag_gems.ops.affine_grid_generator import affine_grid_generator
19from flag_gems.ops.alias_copy import alias_copy, alias_copy_out
20from flag_gems.ops.all import all, all_dim, all_dims
21from flag_gems.ops.amax import amax
22from flag_gems.ops.aminmax import aminmax
23from flag_gems.ops.angle import angle
24from flag_gems.ops.any import any, any_dim, any_dims
25from flag_gems.ops.arange import arange, arange_start
26from flag_gems.ops.arcsinh import arcsinh, arcsinh_out
27from flag_gems.ops.arcsinh_ import arcsinh_
28from flag_gems.ops.arctanh_ import arctanh_
29from flag_gems.ops.argmax import argmax
30from flag_gems.ops.argmin import argmin
31from flag_gems.ops.argsort import argsort
32from flag_gems.ops.as_strided_copy import as_strided_copy, as_strided_copy_out
33from flag_gems.ops.asinh import asinh, asinh_out
34from flag_gems.ops.asinh_ import asinh_
35from flag_gems.ops.assert_async import _assert_async
36from flag_gems.ops.atan import atan, atan_
37from flag_gems.ops.atan2 import atan2, atan2_out
38from flag_gems.ops.attention import (
39 ScaleDotProductAttention,
40 flash_attention_forward,
41 flash_attn_varlen_func,
42 flash_attn_varlen_opt_func,
43 scaled_dot_product_attention,
44 scaled_dot_product_attention_backward,
45 scaled_dot_product_attention_forward,
46)
47from flag_gems.ops.avg_pool2d import avg_pool2d, avg_pool2d_backward
48from flag_gems.ops.avg_pool3d import avg_pool3d, avg_pool3d_backward
49from flag_gems.ops.baddbmm import baddbmm, baddbmm_out
50from flag_gems.ops.batch_norm import batch_norm, batch_norm_backward
51from flag_gems.ops.bernoulli_ import bernoulli_
52from flag_gems.ops.bincount import bincount
53from flag_gems.ops.bitwise_and import (
54 bitwise_and_scalar,
55 bitwise_and_scalar_,
56 bitwise_and_scalar_tensor,
57 bitwise_and_tensor,
58 bitwise_and_tensor_,
59)
60from flag_gems.ops.bitwise_left_shift import bitwise_left_shift
61from flag_gems.ops.bitwise_not import bitwise_not, bitwise_not_
62from flag_gems.ops.bitwise_or import (
63 bitwise_or_scalar,
64 bitwise_or_scalar_,
65 bitwise_or_scalar_tensor,
66 bitwise_or_tensor,
67 bitwise_or_tensor_,
68)
69from flag_gems.ops.bitwise_right_shift import bitwise_right_shift
70from flag_gems.ops.bmm import bmm, bmm_out
71from flag_gems.ops.cat import cat, cat_out
72from flag_gems.ops.cauchy import cauchy, cauchy_
73from flag_gems.ops.ceil import ceil, ceil_, ceil_out
74from flag_gems.ops.celu import celu, celu_
75from flag_gems.ops.clamp import (
76 clamp,
77 clamp_,
78 clamp_min,
79 clamp_min_,
80 clamp_tensor,
81 clamp_tensor_,
82)
83from flag_gems.ops.clamp_max import clamp_max, clamp_max_ # noqa: F401
84from flag_gems.ops.clip import clip, clip_
85from flag_gems.ops.col2im import col2im
86from flag_gems.ops.concatenate import concatenate
87from flag_gems.ops.conj_physical import conj_physical
88from flag_gems.ops.contiguous import contiguous
89from flag_gems.ops.conv1d import conv1d
90from flag_gems.ops.conv2d import conv2d
91from flag_gems.ops.conv3d import conv3d
92from flag_gems.ops.conv_depthwise2d import _conv_depthwise2d
93from flag_gems.ops.conv_transpose1d import conv_transpose1d
94from flag_gems.ops.conv_transpose2d import conv_transpose2d
95from flag_gems.ops.copy import copy, copy_
96from flag_gems.ops.copysign import copysign, copysign_out
97from flag_gems.ops.cos import cos, cos_
98from flag_gems.ops.cosh import cosh, cosh_, cosh_out
99from flag_gems.ops.count_nonzero import count_nonzero
100from flag_gems.ops.ctc_loss import ctc_loss
101from flag_gems.ops.cudnn_convolution import cudnn_convolution
102from flag_gems.ops.cummax import cummax
103from flag_gems.ops.cummin import cummin
104from flag_gems.ops.cumprod import cumprod, cumprod_
105from flag_gems.ops.cumsum import cumsum, cumsum_out, normed_cumsum
106from flag_gems.ops.diag import diag
107from flag_gems.ops.diag_embed import diag_embed
108from flag_gems.ops.diagonal import diagonal_backward
109from flag_gems.ops.diff import diff
110from flag_gems.ops.digamma_ import digamma_
111from flag_gems.ops.div import (
112 div_mode,
113 div_mode_,
114 floor_divide,
115 floor_divide_,
116 true_divide,
117 true_divide_,
118 true_divide_out,
119)
120from flag_gems.ops.dot import dot
121from flag_gems.ops.dropout import dropout, dropout_backward
122from flag_gems.ops.elu import elu, elu_, elu_backward
123from flag_gems.ops.embedding import embedding, embedding_backward
124from flag_gems.ops.embedding_dense_backward import embedding_dense_backward
125from flag_gems.ops.eq import eq, eq_scalar, equal
126from flag_gems.ops.erf import erf, erf_
127from flag_gems.ops.exp import exp, exp_, exp_out
128from flag_gems.ops.exp2 import exp2, exp2_
129from flag_gems.ops.expm1 import expm1, expm1_, expm1_out
130from flag_gems.ops.exponential_ import exponential_
131from flag_gems.ops.eye import eye
132from flag_gems.ops.eye_m import eye_m
133from flag_gems.ops.feature_dropout import feature_dropout, feature_dropout_
134from flag_gems.ops.fft import fft
135from flag_gems.ops.fill import (
136 fill_scalar,
137 fill_scalar_,
138 fill_scalar_out,
139 fill_tensor,
140 fill_tensor_,
141 fill_tensor_out,
142)
143from flag_gems.ops.flip import flip
144from flag_gems.ops.floor import floor, floor_out
145from flag_gems.ops.floor_ import floor_
146from flag_gems.ops.fmin import fmin, fmin_out
147from flag_gems.ops.fmod import fmod_scalar, fmod_scalar_, fmod_tensor, fmod_tensor_
148from flag_gems.ops.fp8_matmul import fp8_matmul
149from flag_gems.ops.fp8_mqa_logits import fp8_mqa_logits
150from flag_gems.ops.full import full
151from flag_gems.ops.full_like import full_like
152from flag_gems.ops.gather import gather, gather_backward
153from flag_gems.ops.gcd import gcd, gcd_out
154from flag_gems.ops.ge import ge, ge_scalar
155from flag_gems.ops.gelu import gelu, gelu_, gelu_backward
156from flag_gems.ops.get_paged_mqa_logits_metadata import get_paged_mqa_logits_metadata
157from flag_gems.ops.get_scheduler_metadata import get_scheduler_metadata
158from flag_gems.ops.glu import glu, glu_backward
159from flag_gems.ops.greater import (
160 greater,
161 greater_out,
162 greater_scalar,
163 greater_scalar_out,
164)
165from flag_gems.ops.grid_sample import grid_sample
166from flag_gems.ops.group_gemm import group_mm
167from flag_gems.ops.groupnorm import group_norm, group_norm_backward
168from flag_gems.ops.gt import gt, gt_scalar
169from flag_gems.ops.hadamard_transform import (
170 hadamard_transform,
171 hadamard_transform_12N,
172 hadamard_transform_20N,
173 hadamard_transform_28N,
174 hadamard_transform_40N,
175)
176from flag_gems.ops.hardsigmoid import hardsigmoid, hardsigmoid_out
177from flag_gems.ops.hardswish_ import hardswish_
178from flag_gems.ops.histc import histc
179from flag_gems.ops.hstack import hstack
180from flag_gems.ops.hypot import hypot, hypot_out
181from flag_gems.ops.i0 import i0, i0_out
182from flag_gems.ops.i0_ import i0_
183from flag_gems.ops.index import index
184from flag_gems.ops.index_add import index_add, index_add_
185from flag_gems.ops.index_copy_ import index_copy, index_copy_
186from flag_gems.ops.index_put import _index_put_impl_, index_put, index_put_
187from flag_gems.ops.index_select import index_select
188from flag_gems.ops.isclose import allclose, isclose
189from flag_gems.ops.isfinite import isfinite
190from flag_gems.ops.isin import isin
191from flag_gems.ops.isinf import isinf
192from flag_gems.ops.isnan import isnan
193from flag_gems.ops.isneginf import isneginf, isneginf_out
194from flag_gems.ops.kron import kron
195from flag_gems.ops.layernorm import layer_norm, layer_norm_backward
196from flag_gems.ops.le import le, le_scalar
197from flag_gems.ops.leaky_relu import leaky_relu, leaky_relu_, leaky_relu_out
198from flag_gems.ops.lerp import lerp_scalar, lerp_scalar_, lerp_tensor, lerp_tensor_
199from flag_gems.ops.lift_fresh_copy import lift_fresh_copy, lift_fresh_copy_out
200from flag_gems.ops.linspace import linspace
201from flag_gems.ops.log import log
202from flag_gems.ops.log1p import log1p
203from flag_gems.ops.log1p_ import log1p_
204from flag_gems.ops.log10 import log10, log10_, log10_out
205from flag_gems.ops.log_sigmoid import log_sigmoid
206from flag_gems.ops.log_softmax import (
207 log_softmax,
208 log_softmax_backward,
209 log_softmax_backward_out,
210 log_softmax_out,
211)
212from flag_gems.ops.logaddexp import logaddexp, logaddexp_out
213from flag_gems.ops.logical_and import logical_and, logical_and_
214from flag_gems.ops.logical_not import logical_not
215from flag_gems.ops.logical_or import logical_or, logical_or_
216from flag_gems.ops.logical_xor import logical_xor
217from flag_gems.ops.logit import logit, logit_out
218from flag_gems.ops.logit_ import logit_
219from flag_gems.ops.logspace import logspace
220from flag_gems.ops.logsumexp import logsumexp
221from flag_gems.ops.lt import lt, lt_scalar
222from flag_gems.ops.margin_ranking_loss import margin_ranking_loss
223from flag_gems.ops.masked_fill import masked_fill, masked_fill_
224from flag_gems.ops.masked_scatter import masked_scatter, masked_scatter_
225from flag_gems.ops.masked_select import masked_select
226from flag_gems.ops.max import max, max_dim
227from flag_gems.ops.max_pool2d_with_indices import (
228 max_pool2d_backward,
229 max_pool2d_with_indices,
230)
231from flag_gems.ops.max_pool3d_with_indices import (
232 max_pool3d_backward,
233 max_pool3d_with_indices,
234)
235from flag_gems.ops.maximum import maximum
236from flag_gems.ops.mean import mean, mean_dim
237from flag_gems.ops.median import median, median_dim, median_dim_values, median_out
238from flag_gems.ops.min import min, min_dim
239from flag_gems.ops.minimum import minimum
240from flag_gems.ops.mm import mm, mm_out, router_gemm
241from flag_gems.ops.mse_loss import mse_loss
242from flag_gems.ops.mul import mul, mul_
243from flag_gems.ops.multinomial import multinomial
244from flag_gems.ops.mv import mv
245from flag_gems.ops.nan_to_num import nan_to_num
246from flag_gems.ops.ne import ne, ne_scalar
247from flag_gems.ops.neg import neg, neg_
248from flag_gems.ops.new_full import new_full
249from flag_gems.ops.nll_loss_nd import nll_loss_nd_backward, nll_loss_nd_forward
250from flag_gems.ops.nllloss import (
251 nll_loss2d_backward,
252 nll_loss2d_forward,
253 nll_loss_backward,
254 nll_loss_forward,
255)
256from flag_gems.ops.nonzero import nonzero
257from flag_gems.ops.nonzero_numpy import nonzero_numpy
258from flag_gems.ops.normal import (
259 normal_,
260 normal_float_tensor,
261 normal_tensor_float,
262 normal_tensor_tensor,
263)
264from flag_gems.ops.one_hot import one_hot
265from flag_gems.ops.ones import ones
266from flag_gems.ops.ones_like import ones_like
267from flag_gems.ops.pad import constant_pad_nd, pad
268from flag_gems.ops.per_token_group_quant_fp8 import (
269 SUPPORTED_FP8_DTYPE,
270 per_token_group_quant_fp8,
271)
272from flag_gems.ops.pixel_shuffle import pixel_shuffle
273from flag_gems.ops.pixel_unshuffle import pixel_unshuffle, pixel_unshuffle_out
274from flag_gems.ops.poisson import poisson
275from flag_gems.ops.polar import polar
276from flag_gems.ops.pow import (
277 pow_scalar,
278 pow_tensor_scalar,
279 pow_tensor_scalar_,
280 pow_tensor_tensor,
281 pow_tensor_tensor_,
282)
283from flag_gems.ops.prelu import prelu
284from flag_gems.ops.prod import prod, prod_dim
285from flag_gems.ops.quantile import quantile
286from flag_gems.ops.rad2deg import rad2deg, rad2deg_
287from flag_gems.ops.rand import rand
288from flag_gems.ops.rand_like import rand_like
289from flag_gems.ops.randint import randint
290from flag_gems.ops.randn import randn
291from flag_gems.ops.randn_like import randn_like
292from flag_gems.ops.randperm import randperm
293from flag_gems.ops.reciprocal import reciprocal, reciprocal_
294from flag_gems.ops.reflection_pad1d import reflection_pad1d, reflection_pad1d_out
295from flag_gems.ops.reflection_pad1d_backward import reflection_pad1d_backward
296from flag_gems.ops.reflection_pad2d import reflection_pad2d, reflection_pad2d_out
297from flag_gems.ops.relu import relu, relu_
298from flag_gems.ops.relu6 import relu6
299from flag_gems.ops.remainder import remainder, remainder_
300from flag_gems.ops.repeat import repeat
301from flag_gems.ops.repeat_interleave import (
302 repeat_interleave_self_int,
303 repeat_interleave_self_tensor,
304 repeat_interleave_tensor,
305)
306from flag_gems.ops.replication_pad1d import replication_pad1d, replication_pad1d_out
307from flag_gems.ops.replication_pad3d import replication_pad3d
308from flag_gems.ops.resolve_conj import resolve_conj
309from flag_gems.ops.resolve_neg import resolve_neg
310from flag_gems.ops.rms_norm import rms_norm, rms_norm_backward, rms_norm_forward
311from flag_gems.ops.roll import roll
312from flag_gems.ops.round import round, round_, round_out
313from flag_gems.ops.rrelu_with_noise_backward import rrelu_with_noise_backward
314from flag_gems.ops.rsqrt import rsqrt, rsqrt_
315from flag_gems.ops.rsub import rsub_scalar, rsub_tensor
316from flag_gems.ops.scaled_mm import scaled_mm, scaled_mm_out
317from flag_gems.ops.scaled_softmax import scaled_softmax_backward, scaled_softmax_forward
318from flag_gems.ops.scatter import scatter, scatter_
319from flag_gems.ops.scatter_add_ import scatter_add_
320from flag_gems.ops.scatter_reduce import (
321 scatter_reduce,
322 scatter_reduce_,
323 scatter_reduce_out,
324)
325from flag_gems.ops.select_backward import select_backward
326from flag_gems.ops.select_scatter import select_scatter
327from flag_gems.ops.selu import selu
328from flag_gems.ops.selu_ import selu_
329from flag_gems.ops.sgn_ import sgn_
330from flag_gems.ops.sigmoid import sigmoid, sigmoid_, sigmoid_backward
331from flag_gems.ops.signbit import signbit, signbit_out
332from flag_gems.ops.silu import silu, silu_, silu_backward
333from flag_gems.ops.sin import sin, sin_
334from flag_gems.ops.sinh_ import sinh_
335from flag_gems.ops.slice_backward import slice_backward
336from flag_gems.ops.slice_scatter import slice_scatter
337from flag_gems.ops.smooth_l1_loss import (
338 smooth_l1_loss,
339 smooth_l1_loss_backward,
340 smooth_l1_loss_out,
341)
342from flag_gems.ops.soft_margin_loss import soft_margin_loss, soft_margin_loss_out
343from flag_gems.ops.softmax import (
344 softmax,
345 softmax_backward,
346 softmax_backward_out,
347 softmax_out,
348)
349from flag_gems.ops.softplus import softplus
350from flag_gems.ops.softshrink import softshrink, softshrink_out
351from flag_gems.ops.sort import sort, sort_stable
352from flag_gems.ops.special_i0e import special_i0e, special_i0e_out
353from flag_gems.ops.special_i1 import special_i1, special_i1_out
354from flag_gems.ops.sqrt import sqrt, sqrt_
355from flag_gems.ops.square import square, square_, square_out
356from flag_gems.ops.stack import stack
357from flag_gems.ops.std import std
358from flag_gems.ops.sub import sub, sub_
359from flag_gems.ops.sum import sum, sum_dim, sum_dim_out, sum_out
360from flag_gems.ops.svd import svd
361from flag_gems.ops.t_copy import t_copy, t_copy_out
362from flag_gems.ops.tan import tan, tan_
363from flag_gems.ops.tanh import tanh, tanh_, tanh_backward
364from flag_gems.ops.threshold import threshold, threshold_backward
365from flag_gems.ops.tile import tile
366from flag_gems.ops.to import to_copy
367from flag_gems.ops.topk import topk
368from flag_gems.ops.trace import trace
369from flag_gems.ops.tril import tril, tril_, tril_out
370from flag_gems.ops.triu import triu, triu_
371from flag_gems.ops.unfold_backward import unfold_backward
372from flag_gems.ops.uniform import uniform_
373from flag_gems.ops.unique import _unique2
374from flag_gems.ops.unique_consecutive import unique_consecutive
375from flag_gems.ops.upsample_bicubic2d import upsample_bicubic2d
376from flag_gems.ops.upsample_bicubic2d_aa import _upsample_bicubic2d_aa
377from flag_gems.ops.upsample_bicubic2d_aa_backward import _upsample_bicubic2d_aa_backward
378from flag_gems.ops.upsample_linear1d import upsample_linear1d
379from flag_gems.ops.upsample_nearest1d import upsample_nearest1d
380from flag_gems.ops.upsample_nearest2d import upsample_nearest2d
381from flag_gems.ops.upsample_nearest3d import upsample_nearest3d
382from flag_gems.ops.var import var, var_correction, var_dim
383from flag_gems.ops.var_mean import var_mean
384from flag_gems.ops.vdot import vdot
385from flag_gems.ops.vector_norm import vector_norm
386from flag_gems.ops.vstack import vstack
387from flag_gems.ops.w8a8_block_fp8_matmul import w8a8_block_fp8_matmul
388from flag_gems.ops.weightnorm import (
389 weight_norm_interface,
390 weight_norm_interface_backward,
391)
392from flag_gems.ops.where import (
393 where_scalar_other,
394 where_scalar_self,
395 where_self,
396 where_self_out,
397)
398from flag_gems.ops.zero import zero, zero_out
399from flag_gems.ops.zeros import zero_, zeros
400from flag_gems.ops.zeros_like import zeros_like
# Public API of flag_gems.ops: the names re-exported by the imports above.
# Each name must appear exactly once; keep new entries in alphabetical position.
__all__ = [
    "_assert_async",
    "_conv_depthwise2d",
    "_euclidean_dist",
    "_functional_sym_constrain_range_for_size",
    "_index_put_impl_",
    "_is_all_true",
    "_safe_softmax",
    "_unique2",
    "_upsample_bicubic2d_aa",
    "_upsample_bicubic2d_aa_backward",
    "_upsample_nearest_exact1d",
    "abs",
    "abs_",
    "absolute",
    "acos",
    "act_quant_triton",
    "add",
    "add_",
    "addcdiv",
    "addcdiv_out",
    "addcmul",
    "addcmul_out",
    "addmm",
    "addmm_dtype",
    "addmm_dtype_out",
    "addmm_out",
    "addmv",
    "addmv_out",
    "addr",
    "affine_grid_generator",
    "alias_copy",
    "alias_copy_out",
    "all",
    "all_dim",
    "all_dims",
    "allclose",
    "amax",
    "aminmax",
    "angle",
    "any",
    "any_dim",
    "any_dims",
    "arange",
    "arange_start",
    "arcsinh",
    "arcsinh_",
    "arcsinh_out",
    "arctanh_",
    "argmax",
    "argmin",
    "argsort",
    "as_strided_copy",
    "as_strided_copy_out",
    "asinh",
    "asinh_",
    "asinh_out",
    "atan",
    "atan2",
    "atan2_out",
    "atan_",
    "avg_pool2d",
    "avg_pool2d_backward",
    "avg_pool3d",
    "avg_pool3d_backward",
    "baddbmm",
    "baddbmm_out",
    "batch_norm",
    "batch_norm_backward",
    "bernoulli_",
    "bincount",
    "bitwise_and_scalar",
    "bitwise_and_scalar_",
    "bitwise_and_scalar_tensor",
    "bitwise_and_tensor",
    "bitwise_and_tensor_",
    "bitwise_left_shift",
    "bitwise_not",
    "bitwise_not_",
    "bitwise_or_scalar",
    "bitwise_or_scalar_",
    "bitwise_or_scalar_tensor",
    "bitwise_or_tensor",
    "bitwise_or_tensor_",
    "bitwise_right_shift",
    "bmm",
    "bmm_out",
    "cat",
    "cat_out",
    "cauchy",
    "cauchy_",
    "ceil",
    "ceil_",
    "ceil_out",
    "celu",
    "celu_",
    "clamp",
    "clamp_",
    "clamp_max",
    "clamp_max_",
    "clamp_min",
    "clamp_min_",
    "clamp_tensor",
    "clamp_tensor_",
    "clip",
    "clip_",
    "col2im",
    "concatenate",
    "conj_physical",
    "constant_pad_nd",
    "contiguous",
    "conv1d",
    "conv2d",
    "conv3d",
    "conv_transpose1d",
    "conv_transpose2d",
    "copy",
    "copy_",
    "copysign",
    "copysign_out",
    "cos",
    "cos_",
    "cosh",
    "cosh_",
    "cosh_out",
    "count_nonzero",
    "ctc_loss",
    "cudnn_convolution",
    "cummax",
    "cummin",
    "cumprod",
    "cumprod_",
    "cumsum",
    "cumsum_out",
    "diag",
    "diag_embed",
    "diagonal_backward",
    "diff",
    "digamma_",
    "div_mode",
    "div_mode_",
    "dot",
    "dropout",
    "dropout_backward",
    "elu",
    "elu_",
    "elu_backward",
    "embedding",
    "embedding_backward",
    "embedding_dense_backward",
    "eq",
    "eq_scalar",
    "equal",
    "erf",
    "erf_",
    "exp",
    "exp2",
    "exp2_",
    "exp_",
    "exp_out",
    "expm1",
    "expm1_",
    "expm1_out",
    "exponential_",
    "eye",
    "eye_m",
    "feature_dropout",
    "feature_dropout_",
    "fft",
    "fill_scalar",
    "fill_scalar_",
    "fill_scalar_out",
    "fill_tensor",
    "fill_tensor_",
    "fill_tensor_out",
    "flash_attention_forward",
    "flash_attn_varlen_func",
    "flash_attn_varlen_opt_func",
    "flip",
    "floor",
    "floor_",
    "floor_out",
    "floor_divide",
    "floor_divide_",
    "fmin",
    "fmin_out",
    "fmod_scalar",
    "fmod_scalar_",
    "fmod_tensor",
    "fmod_tensor_",
    "fp8_matmul",
    "fp8_mqa_logits",
    "full",
    "full_like",
    "gather",
    "gather_backward",
    "gcd",
    "gcd_out",
    "ge",
    "ge_scalar",
    "gelu",
    "gelu_",
    "gelu_backward",
    "get_paged_mqa_logits_metadata",
    "get_scheduler_metadata",
    "glu",
    "glu_backward",
    "greater",
    "greater_out",
    "greater_scalar",
    "greater_scalar_out",
    "grid_sample",
    "group_mm",
    "group_norm",
    "group_norm_backward",
    "gt",
    "gt_scalar",
    "hadamard_transform",
    "hadamard_transform_12N",
    "hadamard_transform_20N",
    "hadamard_transform_28N",
    "hadamard_transform_40N",
    "hardsigmoid",
    "hardsigmoid_out",
    "hardswish_",
    "histc",
    "hstack",
    "hypot",
    "hypot_out",
    "i0",
    "i0_",
    "i0_out",
    "index",
    "index_add",
    "index_add_",
    "index_copy",
    "index_copy_",
    "index_put",
    "index_put_",
    "index_select",
    "isclose",
    "isfinite",
    "isin",
    "isinf",
    "isnan",
    "isneginf",
    "isneginf_out",
    "kron",
    "layer_norm",
    "layer_norm_backward",
    "le",
    "le_scalar",
    "leaky_relu",
    "leaky_relu_",
    "leaky_relu_out",
    "lerp_scalar",
    "lerp_scalar_",
    "lerp_tensor",
    "lerp_tensor_",
    "lift_fresh_copy",
    "lift_fresh_copy_out",
    "linspace",
    "log",
    "log10",
    "log10_",
    "log10_out",
    "log1p",
    "log1p_",
    "log_sigmoid",
    "log_softmax",
    "log_softmax_backward",
    "log_softmax_backward_out",
    "log_softmax_out",
    "logaddexp",
    "logaddexp_out",
    "logical_and",
    "logical_and_",
    "logical_not",
    "logical_or",
    "logical_or_",
    "logical_xor",
    "logit",
    "logit_",
    "logit_out",
    "logspace",
    "logsumexp",
    "lt",
    "lt_scalar",
    "margin_ranking_loss",
    "masked_fill",
    "masked_fill_",
    "masked_scatter",
    "masked_scatter_",
    "masked_select",
    "max",
    "max_dim",
    "max_pool2d_backward",
    "max_pool2d_with_indices",
    "max_pool3d_backward",
    "max_pool3d_with_indices",
    "maximum",
    "mean",
    "mean_dim",
    "median",
    "median_dim",
    "median_dim_values",
    "median_out",
    "min",
    "min_dim",
    "minimum",
    "mm",
    "mm_out",
    "mse_loss",
    "mul",
    "mul_",
    "multinomial",
    "mv",
    "nan_to_num",
    "ne",
    "ne_scalar",
    "neg",
    "neg_",
    "new_full",
    "nll_loss2d_backward",
    "nll_loss2d_forward",
    "nll_loss_backward",
    "nll_loss_forward",
    "nll_loss_nd_backward",
    "nll_loss_nd_forward",
    "nonzero",
    "nonzero_numpy",
    "normal_",
    "normal_float_tensor",
    "normal_tensor_float",
    "normal_tensor_tensor",
    "normed_cumsum",
    "one_hot",
    "ones",
    "ones_like",
    "pad",
    "per_token_group_quant_fp8",
    "pixel_shuffle",
    "pixel_unshuffle",
    "pixel_unshuffle_out",
    "poisson",
    "polar",
    "pow_scalar",
    "pow_tensor_scalar",
    "pow_tensor_scalar_",
    "pow_tensor_tensor",
    "pow_tensor_tensor_",
    "prelu",
    "prod",
    "prod_dim",
    "quantile",
    "rad2deg",
    "rad2deg_",
    "rand",
    "rand_like",
    "randint",
    "randn",
    "randn_like",
    "randperm",
    "reciprocal",
    "reciprocal_",
    "reflection_pad1d",
    "reflection_pad1d_backward",
    "reflection_pad1d_out",
    "reflection_pad2d",
    "reflection_pad2d_out",
    "relu",
    "relu6",
    "relu_",
    "remainder",
    "remainder_",
    "repeat",
    "repeat_interleave_self_int",
    "repeat_interleave_self_tensor",
    "repeat_interleave_tensor",
    "replication_pad1d",
    "replication_pad1d_out",
    "replication_pad3d",
    "resolve_conj",
    "resolve_neg",
    "rms_norm",
    "rms_norm_backward",
    "rms_norm_forward",
    "roll",
    "round",
    "round_",
    "round_out",
    "router_gemm",
    "rrelu_with_noise_backward",
    "rsqrt",
    "rsqrt_",
    "rsub_scalar",
    "rsub_tensor",
    "scaled_dot_product_attention",
    "scaled_dot_product_attention_backward",
    "scaled_dot_product_attention_forward",
    "scaled_mm",
    "scaled_mm_out",
    "scaled_softmax_backward",
    "scaled_softmax_forward",
    "ScaleDotProductAttention",
    "scatter",
    "scatter_",
    "scatter_add_",
    "scatter_reduce",
    "scatter_reduce_",
    "scatter_reduce_out",
    "select_backward",
    "select_scatter",
    "selu",
    "selu_",
    "sgn_",
    "sigmoid",
    "sigmoid_",
    "sigmoid_backward",
    "signbit",
    "signbit_out",
    "silu",
    "silu_",
    "silu_backward",
    "sin",
    "sin_",
    "sinh_",
    "slice_backward",
    "slice_scatter",
    "smooth_l1_loss",
    "smooth_l1_loss_backward",
    "smooth_l1_loss_out",
    "soft_margin_loss",
    "soft_margin_loss_out",
    "softmax",
    "softmax_backward",
    "softmax_backward_out",
    "softmax_out",
    "softplus",
    "softshrink",
    "softshrink_out",
    "sort",
    "sort_stable",
    "special_i0e",
    "special_i0e_out",
    "special_i1",
    "special_i1_out",
    "sqrt",
    "sqrt_",
    "square",
    "square_",
    "square_out",
    "stack",
    "std",
    "sub",
    "sub_",
    "sum",
    "sum_dim",
    "sum_dim_out",
    "sum_out",
    "SUPPORTED_FP8_DTYPE",
    "svd",
    "t_copy",
    "t_copy_out",
    "tan",
    "tan_",
    "tanh",
    "tanh_",
    "tanh_backward",
    "threshold",
    "threshold_backward",
    "tile",
    "to_copy",
    "topk",
    "trace",
    "tril",
    "tril_",
    "tril_out",
    "triu",
    "triu_",
    "true_divide",
    "true_divide_",
    "true_divide_out",
    "unfold_backward",
    "uniform_",
    "unique_consecutive",
    "upsample_bicubic2d",
    "upsample_linear1d",
    "upsample_nearest1d",
    "upsample_nearest2d",
    "upsample_nearest3d",
    "var",
    "var_correction",
    "var_dim",
    "var_mean",
    "vdot",
    "vector_norm",
    "vstack",
    "w8a8_block_fp8_matmul",
    "weight_norm_interface",
    "weight_norm_interface_backward",
    "where_scalar_other",
    "where_scalar_self",
    "where_self",
    "where_self_out",
    "zero",
    "zero_",
    "zero_out",
    "zeros",
    "zeros_like",
]