Coverage for src/flag_gems/ops/__init__.py: 100%
255 statements
« prev ^ index » next coverage.py v7.6.9, created at 2026-05-06 06:51 +0800
« prev ^ index » next coverage.py v7.6.9, created at 2026-05-06 06:51 +0800
1from flag_gems.ops._functional_sym_constrain_range_for_size import (
2 _functional_sym_constrain_range_for_size,
3)
4from flag_gems.ops._is_all_true import _is_all_true
5from flag_gems.ops._safe_softmax import _safe_softmax
6from flag_gems.ops._upsample_nearest_exact1d import _upsample_nearest_exact1d
7from flag_gems.ops.abs import abs, abs_
8from flag_gems.ops.absolute import absolute
9from flag_gems.ops.acos import acos
10from flag_gems.ops.act_quant import act_quant_triton
11from flag_gems.ops.add import add, add_
12from flag_gems.ops.addcdiv import addcdiv, addcdiv_out
13from flag_gems.ops.addcmul import addcmul, addcmul_out
14from flag_gems.ops.addmm import addmm, addmm_dtype, addmm_dtype_out, addmm_out
15from flag_gems.ops.addmv import addmv, addmv_out
16from flag_gems.ops.addr import addr
17from flag_gems.ops.alias_copy import alias_copy, alias_copy_out
18from flag_gems.ops.all import all, all_dim, all_dims
19from flag_gems.ops.amax import amax
20from flag_gems.ops.aminmax import aminmax
21from flag_gems.ops.angle import angle
22from flag_gems.ops.any import any, any_dim, any_dims
23from flag_gems.ops.arange import arange, arange_start
24from flag_gems.ops.arcsinh import arcsinh, arcsinh_out
25from flag_gems.ops.arcsinh_ import arcsinh_
26from flag_gems.ops.arctanh_ import arctanh_
27from flag_gems.ops.argmax import argmax
28from flag_gems.ops.argmin import argmin
29from flag_gems.ops.asinh import asinh, asinh_out
30from flag_gems.ops.asinh_ import asinh_
31from flag_gems.ops.assert_async import _assert_async
32from flag_gems.ops.atan import atan, atan_
33from flag_gems.ops.atan2 import atan2, atan2_out
34from flag_gems.ops.attention import (
35 ScaleDotProductAttention,
36 flash_attention_forward,
37 flash_attn_varlen_func,
38 flash_attn_varlen_opt_func,
39 scaled_dot_product_attention,
40 scaled_dot_product_attention_backward,
41 scaled_dot_product_attention_forward,
42)
43from flag_gems.ops.avg_pool2d import avg_pool2d, avg_pool2d_backward
44from flag_gems.ops.avg_pool3d import avg_pool3d, avg_pool3d_backward
45from flag_gems.ops.baddbmm import baddbmm, baddbmm_out
46from flag_gems.ops.batch_norm import batch_norm, batch_norm_backward
47from flag_gems.ops.bernoulli_ import bernoulli_
48from flag_gems.ops.bitwise_and import (
49 bitwise_and_scalar,
50 bitwise_and_scalar_,
51 bitwise_and_scalar_tensor,
52 bitwise_and_tensor,
53 bitwise_and_tensor_,
54)
55from flag_gems.ops.bitwise_left_shift import bitwise_left_shift
56from flag_gems.ops.bitwise_not import bitwise_not, bitwise_not_
57from flag_gems.ops.bitwise_or import (
58 bitwise_or_scalar,
59 bitwise_or_scalar_,
60 bitwise_or_scalar_tensor,
61 bitwise_or_tensor,
62 bitwise_or_tensor_,
63)
64from flag_gems.ops.bitwise_right_shift import bitwise_right_shift
65from flag_gems.ops.bmm import bmm, bmm_out
66from flag_gems.ops.cat import cat, cat_out
67from flag_gems.ops.ceil import ceil, ceil_, ceil_out
68from flag_gems.ops.celu import celu, celu_
69from flag_gems.ops.clamp import (
70 clamp,
71 clamp_,
72 clamp_min,
73 clamp_min_,
74 clamp_tensor,
75 clamp_tensor_,
76)
77from flag_gems.ops.clip import clip, clip_
78from flag_gems.ops.conj_physical import conj_physical
79from flag_gems.ops.contiguous import contiguous
80from flag_gems.ops.conv1d import conv1d
81from flag_gems.ops.conv2d import conv2d
82from flag_gems.ops.conv3d import conv3d
83from flag_gems.ops.conv_depthwise2d import _conv_depthwise2d
84from flag_gems.ops.copy import copy, copy_
85from flag_gems.ops.copysign import copysign, copysign_out
86from flag_gems.ops.cos import cos, cos_
87from flag_gems.ops.cosh import cosh, cosh_, cosh_out
88from flag_gems.ops.count_nonzero import count_nonzero
89from flag_gems.ops.cummax import cummax
90from flag_gems.ops.cummin import cummin
91from flag_gems.ops.cumsum import cumsum, cumsum_out, normed_cumsum
92from flag_gems.ops.diag import diag
93from flag_gems.ops.diag_embed import diag_embed
94from flag_gems.ops.diagonal import diagonal_backward
95from flag_gems.ops.digamma_ import digamma_
96from flag_gems.ops.div import (
97 div_mode,
98 div_mode_,
99 floor_divide,
100 floor_divide_,
101 remainder,
102 remainder_,
103 true_divide,
104 true_divide_,
105 true_divide_out,
106)
107from flag_gems.ops.dot import dot
108from flag_gems.ops.dropout import dropout, dropout_backward
109from flag_gems.ops.elu import elu, elu_, elu_backward
110from flag_gems.ops.embedding import embedding, embedding_backward
111from flag_gems.ops.embedding_dense_backward import embedding_dense_backward
112from flag_gems.ops.eq import eq, eq_scalar, equal
113from flag_gems.ops.erf import erf, erf_
114from flag_gems.ops.exp import exp, exp_, exp_out
115from flag_gems.ops.exp2 import exp2, exp2_
116from flag_gems.ops.expm1 import expm1, expm1_, expm1_out
117from flag_gems.ops.exponential_ import exponential_
118from flag_gems.ops.eye import eye
119from flag_gems.ops.eye_m import eye_m
120from flag_gems.ops.fill import (
121 fill_scalar,
122 fill_scalar_,
123 fill_scalar_out,
124 fill_tensor,
125 fill_tensor_,
126 fill_tensor_out,
127)
128from flag_gems.ops.flip import flip
129from flag_gems.ops.floor_ import floor_
130from flag_gems.ops.fmin import fmin, fmin_out
131from flag_gems.ops.fp8_matmul import fp8_matmul
132from flag_gems.ops.full import full
133from flag_gems.ops.full_like import full_like
134from flag_gems.ops.gather import gather, gather_backward
135from flag_gems.ops.gcd import gcd, gcd_out
136from flag_gems.ops.ge import ge, ge_scalar
137from flag_gems.ops.gelu import gelu, gelu_, gelu_backward
138from flag_gems.ops.get_paged_mqa_logits_metadata import get_paged_mqa_logits_metadata
139from flag_gems.ops.get_scheduler_metadata import get_scheduler_metadata
140from flag_gems.ops.glu import glu, glu_backward
141from flag_gems.ops.greater import (
142 greater,
143 greater_out,
144 greater_scalar,
145 greater_scalar_out,
146)
147from flag_gems.ops.grid_sample import grid_sample
148from flag_gems.ops.group_gemm import group_mm
149from flag_gems.ops.groupnorm import group_norm, group_norm_backward
150from flag_gems.ops.gt import gt, gt_scalar
151from flag_gems.ops.hadamard_transform import hadamard_transform
152from flag_gems.ops.hardsigmoid import hardsigmoid, hardsigmoid_out
153from flag_gems.ops.hardswish_ import hardswish_
154from flag_gems.ops.hstack import hstack
155from flag_gems.ops.hypot import hypot, hypot_out
156from flag_gems.ops.i0 import i0, i0_out
157from flag_gems.ops.i0_ import i0_
158from flag_gems.ops.index import index
159from flag_gems.ops.index_add import index_add, index_add_
160from flag_gems.ops.index_put import _index_put_impl_, index_put, index_put_
161from flag_gems.ops.index_select import index_select
162from flag_gems.ops.isclose import allclose, isclose
163from flag_gems.ops.isfinite import isfinite
164from flag_gems.ops.isin import isin
165from flag_gems.ops.isinf import isinf
166from flag_gems.ops.isnan import isnan
167from flag_gems.ops.isneginf import isneginf, isneginf_out
168from flag_gems.ops.kron import kron
169from flag_gems.ops.layernorm import layer_norm, layer_norm_backward
170from flag_gems.ops.le import le, le_scalar
171from flag_gems.ops.leaky_relu import leaky_relu, leaky_relu_, leaky_relu_out
172from flag_gems.ops.lerp import lerp_scalar, lerp_scalar_, lerp_tensor, lerp_tensor_
173from flag_gems.ops.lift_fresh_copy import lift_fresh_copy, lift_fresh_copy_out
174from flag_gems.ops.linspace import linspace
175from flag_gems.ops.log import log
176from flag_gems.ops.log1p_ import log1p_
177from flag_gems.ops.log10 import log10, log10_, log10_out
178from flag_gems.ops.log_sigmoid import log_sigmoid
179from flag_gems.ops.log_softmax import (
180 log_softmax,
181 log_softmax_backward,
182 log_softmax_backward_out,
183 log_softmax_out,
184)
185from flag_gems.ops.logaddexp import logaddexp, logaddexp_out
186from flag_gems.ops.logical_and import logical_and, logical_and_
187from flag_gems.ops.logical_not import logical_not
188from flag_gems.ops.logical_or import logical_or, logical_or_
189from flag_gems.ops.logical_xor import logical_xor
190from flag_gems.ops.logit import logit, logit_out
191from flag_gems.ops.logit_ import logit_
192from flag_gems.ops.logspace import logspace
193from flag_gems.ops.lt import lt, lt_scalar
194from flag_gems.ops.margin_ranking_loss import margin_ranking_loss
195from flag_gems.ops.masked_fill import masked_fill, masked_fill_
196from flag_gems.ops.masked_scatter import masked_scatter, masked_scatter_
197from flag_gems.ops.masked_select import masked_select
198from flag_gems.ops.max import max, max_dim
199from flag_gems.ops.max_pool2d_with_indices import (
200 max_pool2d_backward,
201 max_pool2d_with_indices,
202)
203from flag_gems.ops.max_pool3d_with_indices import (
204 max_pool3d_backward,
205 max_pool3d_with_indices,
206)
207from flag_gems.ops.maximum import maximum
208from flag_gems.ops.mean import mean, mean_dim
209from flag_gems.ops.min import min, min_dim
210from flag_gems.ops.minimum import minimum
211from flag_gems.ops.mm import mm, mm_out
212from flag_gems.ops.mse_loss import mse_loss
213from flag_gems.ops.mul import mul, mul_
214from flag_gems.ops.multinomial import multinomial
215from flag_gems.ops.mv import mv
216from flag_gems.ops.nan_to_num import nan_to_num
217from flag_gems.ops.ne import ne, ne_scalar
218from flag_gems.ops.neg import neg, neg_
219from flag_gems.ops.new_full import new_full
220from flag_gems.ops.nll_loss_nd import nll_loss_nd_backward, nll_loss_nd_forward
221from flag_gems.ops.nllloss import (
222 nll_loss2d_backward,
223 nll_loss2d_forward,
224 nll_loss_backward,
225 nll_loss_forward,
226)
227from flag_gems.ops.nonzero import nonzero
228from flag_gems.ops.normal import (
229 normal_,
230 normal_float_tensor,
231 normal_tensor_float,
232 normal_tensor_tensor,
233)
234from flag_gems.ops.one_hot import one_hot
235from flag_gems.ops.ones import ones
236from flag_gems.ops.ones_like import ones_like
237from flag_gems.ops.pad import constant_pad_nd, pad
238from flag_gems.ops.per_token_group_quant_fp8 import (
239 SUPPORTED_FP8_DTYPE,
240 per_token_group_quant_fp8,
241)
242from flag_gems.ops.pixel_shuffle import pixel_shuffle
243from flag_gems.ops.pixel_unshuffle import pixel_unshuffle, pixel_unshuffle_out
244from flag_gems.ops.polar import polar
245from flag_gems.ops.pow import (
246 pow_scalar,
247 pow_tensor_scalar,
248 pow_tensor_scalar_,
249 pow_tensor_tensor,
250 pow_tensor_tensor_,
251)
252from flag_gems.ops.prelu import prelu
253from flag_gems.ops.prod import prod, prod_dim
254from flag_gems.ops.quantile import quantile
255from flag_gems.ops.rand import rand
256from flag_gems.ops.rand_like import rand_like
257from flag_gems.ops.randn import randn
258from flag_gems.ops.randn_like import randn_like
259from flag_gems.ops.randperm import randperm
260from flag_gems.ops.reciprocal import reciprocal, reciprocal_
261from flag_gems.ops.reflection_pad1d import reflection_pad1d, reflection_pad1d_out
262from flag_gems.ops.reflection_pad2d import reflection_pad2d, reflection_pad2d_out
263from flag_gems.ops.relu import relu, relu_
264from flag_gems.ops.relu6 import relu6
265from flag_gems.ops.repeat import repeat
266from flag_gems.ops.repeat_interleave import (
267 repeat_interleave_self_int,
268 repeat_interleave_self_tensor,
269 repeat_interleave_tensor,
270)
271from flag_gems.ops.replication_pad1d import replication_pad1d, replication_pad1d_out
272from flag_gems.ops.replication_pad3d import replication_pad3d
273from flag_gems.ops.resolve_conj import resolve_conj
274from flag_gems.ops.resolve_neg import resolve_neg
275from flag_gems.ops.rms_norm import rms_norm, rms_norm_backward, rms_norm_forward
276from flag_gems.ops.roll import roll
277from flag_gems.ops.round import round, round_, round_out
278from flag_gems.ops.rrelu_with_noise_backward import rrelu_with_noise_backward
279from flag_gems.ops.rsqrt import rsqrt, rsqrt_
280from flag_gems.ops.scaled_softmax import scaled_softmax_backward, scaled_softmax_forward
281from flag_gems.ops.scatter import scatter, scatter_
282from flag_gems.ops.scatter_add_ import scatter_add_
283from flag_gems.ops.select_backward import select_backward
284from flag_gems.ops.select_scatter import select_scatter
285from flag_gems.ops.selu import selu
286from flag_gems.ops.selu_ import selu_
287from flag_gems.ops.sgn_ import sgn_
288from flag_gems.ops.sigmoid import sigmoid, sigmoid_, sigmoid_backward
289from flag_gems.ops.signbit import signbit, signbit_out
290from flag_gems.ops.silu import silu, silu_, silu_backward
291from flag_gems.ops.sin import sin, sin_
292from flag_gems.ops.sinh_ import sinh_
293from flag_gems.ops.slice_backward import slice_backward
294from flag_gems.ops.slice_scatter import slice_scatter
295from flag_gems.ops.soft_margin_loss import soft_margin_loss, soft_margin_loss_out
296from flag_gems.ops.softmax import (
297 softmax,
298 softmax_backward,
299 softmax_backward_out,
300 softmax_out,
301)
302from flag_gems.ops.softplus import softplus
303from flag_gems.ops.softshrink import softshrink, softshrink_out
304from flag_gems.ops.sort import sort, sort_stable
305from flag_gems.ops.special_i0e import special_i0e, special_i0e_out
306from flag_gems.ops.special_i1 import special_i1, special_i1_out
307from flag_gems.ops.sqrt import sqrt, sqrt_
308from flag_gems.ops.square import square, square_, square_out
309from flag_gems.ops.stack import stack
310from flag_gems.ops.std import std
311from flag_gems.ops.sub import sub, sub_
312from flag_gems.ops.sum import sum, sum_dim, sum_dim_out, sum_out
313from flag_gems.ops.t_copy import t_copy, t_copy_out
314from flag_gems.ops.tan import tan, tan_
315from flag_gems.ops.tanh import tanh, tanh_, tanh_backward
316from flag_gems.ops.threshold import threshold, threshold_backward
317from flag_gems.ops.tile import tile
318from flag_gems.ops.to import to_copy
319from flag_gems.ops.topk import topk
320from flag_gems.ops.trace import trace
321from flag_gems.ops.tril import tril, tril_out
322from flag_gems.ops.triu import triu, triu_
323from flag_gems.ops.unfold_backward import unfold_backward
324from flag_gems.ops.uniform import uniform_
325from flag_gems.ops.unique import _unique2
326from flag_gems.ops.unique_consecutive import unique_consecutive
327from flag_gems.ops.upsample_bicubic2d import upsample_bicubic2d
328from flag_gems.ops.upsample_bicubic2d_aa import _upsample_bicubic2d_aa
329from flag_gems.ops.upsample_bicubic2d_aa_backward import _upsample_bicubic2d_aa_backward
330from flag_gems.ops.upsample_linear1d import upsample_linear1d
331from flag_gems.ops.upsample_nearest1d import upsample_nearest1d
332from flag_gems.ops.upsample_nearest2d import upsample_nearest2d
333from flag_gems.ops.upsample_nearest3d import upsample_nearest3d
334from flag_gems.ops.var import var, var_correction, var_dim
335from flag_gems.ops.var_mean import var_mean
336from flag_gems.ops.vdot import vdot
337from flag_gems.ops.vector_norm import vector_norm
338from flag_gems.ops.vstack import vstack
339from flag_gems.ops.w8a8_block_fp8_matmul import w8a8_block_fp8_matmul
340from flag_gems.ops.weightnorm import (
341 weight_norm_interface,
342 weight_norm_interface_backward,
343)
344from flag_gems.ops.where import (
345 where_scalar_other,
346 where_scalar_self,
347 where_self,
348 where_self_out,
349)
350from flag_gems.ops.zero import zero, zero_out
351from flag_gems.ops.zeros import zero_, zeros
352from flag_gems.ops.zeros_like import zeros_like
354__all__ = [
355 "_assert_async",
356 "_conv_depthwise2d",
357 "_functional_sym_constrain_range_for_size",
358 "_index_put_impl_",
359 "_is_all_true",
360 "_safe_softmax",
361 "_unique2",
362 "_upsample_bicubic2d_aa",
363 "_upsample_bicubic2d_aa_backward",
364 "_upsample_nearest_exact1d",
365 "abs",
366 "abs_",
367 "absolute",
368 "act_quant_triton",
369 "acos",
370 "add",
371 "add_",
372 "addcdiv",
373 "addcdiv_out",
374 "addcmul",
375 "addcmul_out",
376 "addmm",
377 "addmm_dtype",
378 "addmm_dtype_out",
379 "addmm_out",
380 "addmv",
381 "addmv_out",
382 "addr",
383 "alias_copy",
384 "alias_copy_out",
385 "all",
386 "all_dim",
387 "all_dims",
388 "allclose",
389 "amax",
390 "aminmax",
391 "angle",
392 "any",
393 "any_dim",
394 "any_dims",
395 "arange",
396 "arange_start",
397 "arcsinh",
398 "arcsinh_out",
399 "arctanh_",
400 "arcsinh_",
401 "argmax",
402 "argmin",
403 "asinh",
404 "asinh_",
405 "asinh_out",
406 "atan",
407 "atan_",
408 "atan2",
409 "atan2_out",
410 "avg_pool2d",
411 "avg_pool2d_backward",
412 "avg_pool3d",
413 "avg_pool3d_backward",
414 "baddbmm",
415 "baddbmm_out",
416 "batch_norm",
417 "batch_norm_backward",
418 "bernoulli_",
419 "bitwise_and_scalar",
420 "bitwise_and_scalar_",
421 "bitwise_and_scalar_tensor",
422 "bitwise_and_tensor",
423 "bitwise_and_tensor_",
424 "bitwise_left_shift",
425 "bitwise_not",
426 "bitwise_not_",
427 "bitwise_or_scalar",
428 "bitwise_or_scalar_",
429 "bitwise_or_scalar_tensor",
430 "bitwise_or_tensor",
431 "bitwise_or_tensor_",
432 "bitwise_right_shift",
433 "bmm",
434 "bmm_out",
435 "cat",
436 "cat_out",
437 "ceil",
438 "ceil_",
439 "ceil_out",
440 "celu",
441 "celu_",
442 "clamp",
443 "clamp_",
444 "clamp_min",
445 "clamp_min_",
446 "clamp_tensor",
447 "clamp_tensor_",
448 "clip",
449 "clip_",
450 "constant_pad_nd",
451 "contiguous",
452 "conv1d",
453 "conv2d",
454 "conv3d",
455 "copy",
456 "copy_",
457 "copysign",
458 "copysign_out",
459 "cos",
460 "cos_",
461 "cosh",
462 "cosh_",
463 "cosh_out",
464 "count_nonzero",
465 "cummax",
466 "cummin",
467 "cumsum",
468 "cumsum_out",
469 "conj_physical",
470 "diag",
471 "diag_embed",
472 "diagonal_backward",
473 "digamma_",
474 "div_mode",
475 "div_mode_",
476 "dot",
477 "dropout",
478 "dropout_backward",
479 "elu",
480 "elu_",
481 "elu_backward",
482 "embedding",
483 "embedding_backward",
484 "embedding_dense_backward",
485 "eq",
486 "eq_scalar",
487 "equal",
488 "erf",
489 "erf_",
490 "exp",
491 "exp_",
492 "exp_out",
493 "exp2",
494 "exp2_",
495 "expm1",
496 "expm1_",
497 "expm1_out",
498 "exponential_",
499 "eye",
500 "eye_m",
501 "fill_scalar",
502 "fill_scalar_",
503 "fill_scalar_out",
504 "fill_tensor",
505 "fill_tensor_",
506 "fill_tensor_out",
507 "flash_attention_forward",
508 "flash_attn_varlen_func",
509 "flash_attn_varlen_opt_func",
510 "flip",
511 "floor_",
512 "floor_divide",
513 "floor_divide_",
514 "fmin",
515 "fmin_out",
516 "full",
517 "full_like",
518 "gather",
519 "gather_backward",
520 "gcd",
521 "gcd_out",
522 "ge",
523 "ge_scalar",
524 "gelu",
525 "gelu_",
526 "gelu_backward",
527 "get_paged_mqa_logits_metadata",
528 "get_scheduler_metadata",
529 "glu",
530 "glu_backward",
531 "grid_sample",
532 "greater",
533 "greater_out",
534 "greater_scalar",
535 "greater_scalar_out",
536 "group_mm",
537 "group_norm",
538 "group_norm_backward",
539 "gt",
540 "gt_scalar",
541 "hadamard_transform",
542 "hardsigmoid",
543 "hardsigmoid_out",
544 "hardswish_",
545 "hstack",
546 "hypot",
547 "hypot_out",
548 "i0",
549 "i0_out",
550 "i0_",
551 "index",
552 "index_add",
553 "index_add_",
554 "index_put",
555 "index_put_",
556 "index_select",
557 "isclose",
558 "isfinite",
559 "isin",
560 "isinf",
561 "isnan",
562 "isneginf",
563 "isneginf_out",
564 "kron",
565 "layer_norm",
566 "layer_norm_backward",
567 "leaky_relu",
568 "leaky_relu_",
569 "leaky_relu_out",
570 "le",
571 "le_scalar",
572 "lerp_scalar",
573 "lerp_scalar_",
574 "lerp_tensor",
575 "lerp_tensor_",
576 "lift_fresh_copy",
577 "lift_fresh_copy_out",
578 "linspace",
579 "log",
580 "log10",
581 "log10_",
582 "log10_out",
583 "log_sigmoid",
584 "log_softmax",
585 "log_softmax_backward",
586 "log_softmax_backward_out",
587 "log_softmax_out",
588 "log1p_",
589 "logaddexp",
590 "logaddexp_out",
591 "logical_and",
592 "logical_and_",
593 "logical_not",
594 "logical_or",
595 "logical_or_",
596 "logical_xor",
597 "logit",
598 "logit_out",
599 "logit_",
600 "logspace",
601 "lt",
602 "lt_scalar",
603 "margin_ranking_loss",
604 "masked_fill",
605 "masked_fill_",
606 "masked_scatter",
607 "masked_scatter_",
608 "masked_select",
609 "max",
610 "max_dim",
611 "max_pool2d_with_indices",
612 "max_pool2d_backward",
613 "max_pool3d_with_indices",
614 "max_pool3d_backward",
615 "maximum",
616 "mean",
617 "mean_dim",
618 "min",
619 "min_dim",
620 "minimum",
621 "mm",
622 "mm_out",
623 "mse_loss",
624 "mul",
625 "mul_",
626 "multinomial",
627 "mv",
628 "nan_to_num",
629 "ne",
630 "ne_scalar",
631 "neg",
632 "neg_",
633 "new_full",
634 "nll_loss_backward",
635 "nll_loss_forward",
636 "nll_loss2d_backward",
637 "nll_loss2d_forward",
638 "nll_loss_nd_forward",
639 "nll_loss_nd_backward",
640 "nonzero",
641 "normal_float_tensor",
642 "normal_tensor_float",
643 "normal_tensor_tensor",
644 "normal_",
645 "normed_cumsum",
646 "ones",
647 "ones_like",
648 "one_hot",
649 "pad",
650 "per_token_group_quant_fp8",
651 "pixel_shuffle",
652 "pixel_unshuffle",
653 "pixel_unshuffle_out",
654 "polar",
655 "pow_scalar",
656 "pow_tensor_scalar",
657 "pow_tensor_scalar_",
658 "pow_tensor_tensor",
659 "pow_tensor_tensor_",
660 "prelu",
661 "prod",
662 "prod_dim",
663 "quantile",
664 "rand",
665 "rand_like",
666 "randn",
667 "randn_like",
668 "randperm",
669 "reciprocal",
670 "reciprocal_",
671 "reflection_pad2d",
672 "reflection_pad2d_out",
673 "reflection_pad1d",
674 "reflection_pad1d_out",
675 "relu",
676 "relu_",
677 "relu6",
678 "remainder",
679 "remainder_",
680 "repeat",
681 "repeat_interleave_self_int",
682 "repeat_interleave_self_tensor",
683 "repeat_interleave_tensor",
684 "replication_pad1d",
685 "replication_pad1d_out",
686 "replication_pad3d",
687 "resolve_conj",
688 "resolve_neg",
689 "rms_norm",
690 "rms_norm_backward",
691 "rms_norm_forward",
692 "roll",
693 "round",
694 "round_",
695 "round_out",
696 "rrelu_with_noise_backward",
697 "rsqrt",
698 "rsqrt_",
699 "scaled_dot_product_attention",
700 "scaled_dot_product_attention_backward",
701 "scaled_dot_product_attention_forward",
702 "scaled_softmax_backward",
703 "scaled_softmax_forward",
704 "scatter",
705 "scatter_",
706 "scatter_add_",
707 "select_backward",
708 "select_scatter",
709 "selu",
710 "selu_",
711 "sgn_",
712 "sigmoid",
713 "sigmoid_",
714 "sigmoid_backward",
715 "signbit",
716 "signbit_out",
717 "silu",
718 "silu_",
719 "silu_backward",
720 "sin",
721 "sin_",
722 "sinh_",
723 "slice_backward",
724 "slice_scatter",
725 "soft_margin_loss",
726 "soft_margin_loss_out",
727 "softmax",
728 "softmax_backward",
729 "softmax_backward_out",
730 "softmax_out",
731 "softplus",
732 "softshrink",
733 "softshrink_out",
734 "sort",
735 "sort_stable",
736 "special_i1",
737 "special_i1_out",
738 "special_i0e",
739 "special_i0e_out",
740 "sqrt",
741 "sqrt_",
742 "square",
743 "square_",
744 "square_out",
745 "stack",
746 "std",
747 "sub",
748 "sub_",
749 "sum",
750 "sum_dim",
751 "sum_dim_out",
752 "sum_out",
753 "ScaleDotProductAttention",
754 "SUPPORTED_FP8_DTYPE",
755 "t_copy",
756 "t_copy_out",
757 "tan",
758 "tan_",
759 "tanh",
760 "tanh_",
761 "tanh_backward",
762 "threshold",
763 "threshold_backward",
764 "tile",
765 "to_copy",
766 "topk",
767 "trace",
768 "tril",
769 "tril_out",
770 "triu",
771 "triu_",
772 "true_divide",
773 "true_divide_",
774 "true_divide_out",
775 "unfold_backward",
776 "uniform_",
777 "unique_consecutive",
778 "upsample_bicubic2d",
779 "upsample_linear1d",
780 "upsample_nearest1d",
781 "upsample_nearest2d",
782 "upsample_nearest3d",
783 "var_mean",
784 "var",
785 "var_correction",
786 "var_dim",
787 "vdot",
788 "vector_norm",
789 "vstack",
790 "fp8_matmul",
791 "w8a8_block_fp8_matmul",
792 "weight_norm_interface",
793 "weight_norm_interface_backward",
794 "where_scalar_other",
795 "where_scalar_self",
796 "where_self",
797 "where_self_out",
798 "zero",
799 "zero_out",
800 "zero_",
801 "zeros",
802 "zeros_like",
803]