Coverage for src/flag_gems/ops/__init__.py: 100%

291 statements  

« prev     ^ index     » next       coverage.py v7.6.9, created at 2026-06-04 09:03 +0800

1from flag_gems.ops._euclidean_dist import _euclidean_dist 

2from flag_gems.ops._functional_sym_constrain_range_for_size import ( 

3 _functional_sym_constrain_range_for_size, 

4) 

5from flag_gems.ops._is_all_true import _is_all_true 

6from flag_gems.ops._safe_softmax import _safe_softmax 

7from flag_gems.ops._upsample_nearest_exact1d import _upsample_nearest_exact1d 

8from flag_gems.ops.abs import abs, abs_ 

9from flag_gems.ops.absolute import absolute 

10from flag_gems.ops.acos import acos 

11from flag_gems.ops.act_quant import act_quant_triton 

12from flag_gems.ops.add import add, add_ 

13from flag_gems.ops.addcdiv import addcdiv, addcdiv_out 

14from flag_gems.ops.addcmul import addcmul, addcmul_out 

15from flag_gems.ops.addmm import addmm, addmm_dtype, addmm_dtype_out, addmm_out 

16from flag_gems.ops.addmv import addmv, addmv_out 

17from flag_gems.ops.addr import addr 

18from flag_gems.ops.affine_grid_generator import affine_grid_generator 

19from flag_gems.ops.alias_copy import alias_copy, alias_copy_out 

20from flag_gems.ops.all import all, all_dim, all_dims 

21from flag_gems.ops.amax import amax 

22from flag_gems.ops.aminmax import aminmax 

23from flag_gems.ops.angle import angle 

24from flag_gems.ops.any import any, any_dim, any_dims 

25from flag_gems.ops.arange import arange, arange_start 

26from flag_gems.ops.arcsinh import arcsinh, arcsinh_out 

27from flag_gems.ops.arcsinh_ import arcsinh_ 

28from flag_gems.ops.arctanh_ import arctanh_ 

29from flag_gems.ops.argmax import argmax 

30from flag_gems.ops.argmin import argmin 

31from flag_gems.ops.argsort import argsort 

32from flag_gems.ops.as_strided_copy import as_strided_copy, as_strided_copy_out 

33from flag_gems.ops.asinh import asinh, asinh_out 

34from flag_gems.ops.asinh_ import asinh_ 

35from flag_gems.ops.assert_async import _assert_async 

36from flag_gems.ops.atan import atan, atan_ 

37from flag_gems.ops.atan2 import atan2, atan2_out 

38from flag_gems.ops.attention import ( 

39 ScaleDotProductAttention, 

40 flash_attention_forward, 

41 flash_attn_varlen_func, 

42 flash_attn_varlen_opt_func, 

43 scaled_dot_product_attention, 

44 scaled_dot_product_attention_backward, 

45 scaled_dot_product_attention_forward, 

46) 

47from flag_gems.ops.avg_pool2d import avg_pool2d, avg_pool2d_backward 

48from flag_gems.ops.avg_pool3d import avg_pool3d, avg_pool3d_backward 

49from flag_gems.ops.baddbmm import baddbmm, baddbmm_out 

50from flag_gems.ops.batch_norm import batch_norm, batch_norm_backward 

51from flag_gems.ops.bernoulli_ import bernoulli_ 

52from flag_gems.ops.bincount import bincount 

53from flag_gems.ops.bitwise_and import ( 

54 bitwise_and_scalar, 

55 bitwise_and_scalar_, 

56 bitwise_and_scalar_tensor, 

57 bitwise_and_tensor, 

58 bitwise_and_tensor_, 

59) 

60from flag_gems.ops.bitwise_left_shift import bitwise_left_shift 

61from flag_gems.ops.bitwise_not import bitwise_not, bitwise_not_ 

62from flag_gems.ops.bitwise_or import ( 

63 bitwise_or_scalar, 

64 bitwise_or_scalar_, 

65 bitwise_or_scalar_tensor, 

66 bitwise_or_tensor, 

67 bitwise_or_tensor_, 

68) 

69from flag_gems.ops.bitwise_right_shift import bitwise_right_shift 

70from flag_gems.ops.bmm import bmm, bmm_out 

71from flag_gems.ops.cat import cat, cat_out 

72from flag_gems.ops.cauchy import cauchy, cauchy_ 

73from flag_gems.ops.ceil import ceil, ceil_, ceil_out 

74from flag_gems.ops.celu import celu, celu_ 

75from flag_gems.ops.clamp import ( 

76 clamp, 

77 clamp_, 

78 clamp_min, 

79 clamp_min_, 

80 clamp_tensor, 

81 clamp_tensor_, 

82) 

83from flag_gems.ops.clamp_max import clamp_max, clamp_max_ # noqa: F401 

84from flag_gems.ops.clip import clip, clip_ 

85from flag_gems.ops.col2im import col2im 

86from flag_gems.ops.concatenate import concatenate 

87from flag_gems.ops.conj_physical import conj_physical 

88from flag_gems.ops.contiguous import contiguous 

89from flag_gems.ops.conv1d import conv1d 

90from flag_gems.ops.conv2d import conv2d 

91from flag_gems.ops.conv3d import conv3d 

92from flag_gems.ops.conv_depthwise2d import _conv_depthwise2d 

93from flag_gems.ops.conv_transpose1d import conv_transpose1d 

94from flag_gems.ops.conv_transpose2d import conv_transpose2d 

95from flag_gems.ops.copy import copy, copy_ 

96from flag_gems.ops.copysign import copysign, copysign_out 

97from flag_gems.ops.cos import cos, cos_ 

98from flag_gems.ops.cosh import cosh, cosh_, cosh_out 

99from flag_gems.ops.count_nonzero import count_nonzero 

100from flag_gems.ops.ctc_loss import ctc_loss 

101from flag_gems.ops.cudnn_convolution import cudnn_convolution 

102from flag_gems.ops.cummax import cummax 

103from flag_gems.ops.cummin import cummin 

104from flag_gems.ops.cumprod import cumprod, cumprod_ 

105from flag_gems.ops.cumsum import cumsum, cumsum_out, normed_cumsum 

106from flag_gems.ops.diag import diag 

107from flag_gems.ops.diag_embed import diag_embed 

108from flag_gems.ops.diagonal import diagonal_backward 

109from flag_gems.ops.diff import diff 

110from flag_gems.ops.digamma_ import digamma_ 

111from flag_gems.ops.div import ( 

112 div_mode, 

113 div_mode_, 

114 floor_divide, 

115 floor_divide_, 

116 true_divide, 

117 true_divide_, 

118 true_divide_out, 

119) 

120from flag_gems.ops.dot import dot 

121from flag_gems.ops.dropout import dropout, dropout_backward 

122from flag_gems.ops.elu import elu, elu_, elu_backward 

123from flag_gems.ops.embedding import embedding, embedding_backward 

124from flag_gems.ops.embedding_dense_backward import embedding_dense_backward 

125from flag_gems.ops.eq import eq, eq_scalar, equal 

126from flag_gems.ops.erf import erf, erf_ 

127from flag_gems.ops.exp import exp, exp_, exp_out 

128from flag_gems.ops.exp2 import exp2, exp2_ 

129from flag_gems.ops.expm1 import expm1, expm1_, expm1_out 

130from flag_gems.ops.exponential_ import exponential_ 

131from flag_gems.ops.eye import eye 

132from flag_gems.ops.eye_m import eye_m 

133from flag_gems.ops.feature_dropout import feature_dropout, feature_dropout_ 

134from flag_gems.ops.fft import fft 

135from flag_gems.ops.fill import ( 

136 fill_scalar, 

137 fill_scalar_, 

138 fill_scalar_out, 

139 fill_tensor, 

140 fill_tensor_, 

141 fill_tensor_out, 

142) 

143from flag_gems.ops.flip import flip 

144from flag_gems.ops.floor import floor, floor_out 

145from flag_gems.ops.floor_ import floor_ 

146from flag_gems.ops.fmin import fmin, fmin_out 

147from flag_gems.ops.fmod import fmod_scalar, fmod_scalar_, fmod_tensor, fmod_tensor_ 

148from flag_gems.ops.fp8_matmul import fp8_matmul 

149from flag_gems.ops.fp8_mqa_logits import fp8_mqa_logits 

150from flag_gems.ops.full import full 

151from flag_gems.ops.full_like import full_like 

152from flag_gems.ops.gather import gather, gather_backward 

153from flag_gems.ops.gcd import gcd, gcd_out 

154from flag_gems.ops.ge import ge, ge_scalar 

155from flag_gems.ops.gelu import gelu, gelu_, gelu_backward 

156from flag_gems.ops.get_paged_mqa_logits_metadata import get_paged_mqa_logits_metadata 

157from flag_gems.ops.get_scheduler_metadata import get_scheduler_metadata 

158from flag_gems.ops.glu import glu, glu_backward 

159from flag_gems.ops.greater import ( 

160 greater, 

161 greater_out, 

162 greater_scalar, 

163 greater_scalar_out, 

164) 

165from flag_gems.ops.grid_sample import grid_sample 

166from flag_gems.ops.group_gemm import group_mm 

167from flag_gems.ops.groupnorm import group_norm, group_norm_backward 

168from flag_gems.ops.gt import gt, gt_scalar 

169from flag_gems.ops.hadamard_transform import ( 

170 hadamard_transform, 

171 hadamard_transform_12N, 

172 hadamard_transform_20N, 

173 hadamard_transform_28N, 

174 hadamard_transform_40N, 

175) 

176from flag_gems.ops.hardsigmoid import hardsigmoid, hardsigmoid_out 

177from flag_gems.ops.hardswish_ import hardswish_ 

178from flag_gems.ops.histc import histc 

179from flag_gems.ops.hstack import hstack 

180from flag_gems.ops.hypot import hypot, hypot_out 

181from flag_gems.ops.i0 import i0, i0_out 

182from flag_gems.ops.i0_ import i0_ 

183from flag_gems.ops.index import index 

184from flag_gems.ops.index_add import index_add, index_add_ 

185from flag_gems.ops.index_copy_ import index_copy, index_copy_ 

186from flag_gems.ops.index_put import _index_put_impl_, index_put, index_put_ 

187from flag_gems.ops.index_select import index_select 

188from flag_gems.ops.isclose import allclose, isclose 

189from flag_gems.ops.isfinite import isfinite 

190from flag_gems.ops.isin import isin 

191from flag_gems.ops.isinf import isinf 

192from flag_gems.ops.isnan import isnan 

193from flag_gems.ops.isneginf import isneginf, isneginf_out 

194from flag_gems.ops.kron import kron 

195from flag_gems.ops.layernorm import layer_norm, layer_norm_backward 

196from flag_gems.ops.le import le, le_scalar 

197from flag_gems.ops.leaky_relu import leaky_relu, leaky_relu_, leaky_relu_out 

198from flag_gems.ops.lerp import lerp_scalar, lerp_scalar_, lerp_tensor, lerp_tensor_ 

199from flag_gems.ops.lift_fresh_copy import lift_fresh_copy, lift_fresh_copy_out 

200from flag_gems.ops.linspace import linspace 

201from flag_gems.ops.log import log 

202from flag_gems.ops.log1p import log1p 

203from flag_gems.ops.log1p_ import log1p_ 

204from flag_gems.ops.log10 import log10, log10_, log10_out 

205from flag_gems.ops.log_sigmoid import log_sigmoid 

206from flag_gems.ops.log_softmax import ( 

207 log_softmax, 

208 log_softmax_backward, 

209 log_softmax_backward_out, 

210 log_softmax_out, 

211) 

212from flag_gems.ops.logaddexp import logaddexp, logaddexp_out 

213from flag_gems.ops.logical_and import logical_and, logical_and_ 

214from flag_gems.ops.logical_not import logical_not 

215from flag_gems.ops.logical_or import logical_or, logical_or_ 

216from flag_gems.ops.logical_xor import logical_xor 

217from flag_gems.ops.logit import logit, logit_out 

218from flag_gems.ops.logit_ import logit_ 

219from flag_gems.ops.logspace import logspace 

220from flag_gems.ops.logsumexp import logsumexp 

221from flag_gems.ops.lt import lt, lt_scalar 

222from flag_gems.ops.margin_ranking_loss import margin_ranking_loss 

223from flag_gems.ops.masked_fill import masked_fill, masked_fill_ 

224from flag_gems.ops.masked_scatter import masked_scatter, masked_scatter_ 

225from flag_gems.ops.masked_select import masked_select 

226from flag_gems.ops.max import max, max_dim 

227from flag_gems.ops.max_pool2d_with_indices import ( 

228 max_pool2d_backward, 

229 max_pool2d_with_indices, 

230) 

231from flag_gems.ops.max_pool3d_with_indices import ( 

232 max_pool3d_backward, 

233 max_pool3d_with_indices, 

234) 

235from flag_gems.ops.maximum import maximum 

236from flag_gems.ops.mean import mean, mean_dim 

237from flag_gems.ops.median import median, median_dim, median_dim_values, median_out 

238from flag_gems.ops.min import min, min_dim 

239from flag_gems.ops.minimum import minimum 

240from flag_gems.ops.mm import mm, mm_out, router_gemm 

241from flag_gems.ops.mse_loss import mse_loss 

242from flag_gems.ops.mul import mul, mul_ 

243from flag_gems.ops.multinomial import multinomial 

244from flag_gems.ops.mv import mv 

245from flag_gems.ops.nan_to_num import nan_to_num 

246from flag_gems.ops.ne import ne, ne_scalar 

247from flag_gems.ops.neg import neg, neg_ 

248from flag_gems.ops.new_full import new_full 

249from flag_gems.ops.nll_loss_nd import nll_loss_nd_backward, nll_loss_nd_forward 

250from flag_gems.ops.nllloss import ( 

251 nll_loss2d_backward, 

252 nll_loss2d_forward, 

253 nll_loss_backward, 

254 nll_loss_forward, 

255) 

256from flag_gems.ops.nonzero import nonzero 

257from flag_gems.ops.nonzero_numpy import nonzero_numpy 

258from flag_gems.ops.normal import ( 

259 normal_, 

260 normal_float_tensor, 

261 normal_tensor_float, 

262 normal_tensor_tensor, 

263) 

264from flag_gems.ops.one_hot import one_hot 

265from flag_gems.ops.ones import ones 

266from flag_gems.ops.ones_like import ones_like 

267from flag_gems.ops.pad import constant_pad_nd, pad 

268from flag_gems.ops.per_token_group_quant_fp8 import ( 

269 SUPPORTED_FP8_DTYPE, 

270 per_token_group_quant_fp8, 

271) 

272from flag_gems.ops.pixel_shuffle import pixel_shuffle 

273from flag_gems.ops.pixel_unshuffle import pixel_unshuffle, pixel_unshuffle_out 

274from flag_gems.ops.poisson import poisson 

275from flag_gems.ops.polar import polar 

276from flag_gems.ops.pow import ( 

277 pow_scalar, 

278 pow_tensor_scalar, 

279 pow_tensor_scalar_, 

280 pow_tensor_tensor, 

281 pow_tensor_tensor_, 

282) 

283from flag_gems.ops.prelu import prelu 

284from flag_gems.ops.prod import prod, prod_dim 

285from flag_gems.ops.quantile import quantile 

286from flag_gems.ops.rad2deg import rad2deg, rad2deg_ 

287from flag_gems.ops.rand import rand 

288from flag_gems.ops.rand_like import rand_like 

289from flag_gems.ops.randint import randint 

290from flag_gems.ops.randn import randn 

291from flag_gems.ops.randn_like import randn_like 

292from flag_gems.ops.randperm import randperm 

293from flag_gems.ops.reciprocal import reciprocal, reciprocal_ 

294from flag_gems.ops.reflection_pad1d import reflection_pad1d, reflection_pad1d_out 

295from flag_gems.ops.reflection_pad1d_backward import reflection_pad1d_backward 

296from flag_gems.ops.reflection_pad2d import reflection_pad2d, reflection_pad2d_out 

297from flag_gems.ops.relu import relu, relu_ 

298from flag_gems.ops.relu6 import relu6 

299from flag_gems.ops.remainder import remainder, remainder_ 

300from flag_gems.ops.repeat import repeat 

301from flag_gems.ops.repeat_interleave import ( 

302 repeat_interleave_self_int, 

303 repeat_interleave_self_tensor, 

304 repeat_interleave_tensor, 

305) 

306from flag_gems.ops.replication_pad1d import replication_pad1d, replication_pad1d_out 

307from flag_gems.ops.replication_pad3d import replication_pad3d 

308from flag_gems.ops.resolve_conj import resolve_conj 

309from flag_gems.ops.resolve_neg import resolve_neg 

310from flag_gems.ops.rms_norm import rms_norm, rms_norm_backward, rms_norm_forward 

311from flag_gems.ops.roll import roll 

312from flag_gems.ops.round import round, round_, round_out 

313from flag_gems.ops.rrelu_with_noise_backward import rrelu_with_noise_backward 

314from flag_gems.ops.rsqrt import rsqrt, rsqrt_ 

315from flag_gems.ops.rsub import rsub_scalar, rsub_tensor 

316from flag_gems.ops.scaled_mm import scaled_mm, scaled_mm_out 

317from flag_gems.ops.scaled_softmax import scaled_softmax_backward, scaled_softmax_forward 

318from flag_gems.ops.scatter import scatter, scatter_ 

319from flag_gems.ops.scatter_add_ import scatter_add_ 

320from flag_gems.ops.scatter_reduce import ( 

321 scatter_reduce, 

322 scatter_reduce_, 

323 scatter_reduce_out, 

324) 

325from flag_gems.ops.select_backward import select_backward 

326from flag_gems.ops.select_scatter import select_scatter 

327from flag_gems.ops.selu import selu 

328from flag_gems.ops.selu_ import selu_ 

329from flag_gems.ops.sgn_ import sgn_ 

330from flag_gems.ops.sigmoid import sigmoid, sigmoid_, sigmoid_backward 

331from flag_gems.ops.signbit import signbit, signbit_out 

332from flag_gems.ops.silu import silu, silu_, silu_backward 

333from flag_gems.ops.sin import sin, sin_ 

334from flag_gems.ops.sinh_ import sinh_ 

335from flag_gems.ops.slice_backward import slice_backward 

336from flag_gems.ops.slice_scatter import slice_scatter 

337from flag_gems.ops.smooth_l1_loss import ( 

338 smooth_l1_loss, 

339 smooth_l1_loss_backward, 

340 smooth_l1_loss_out, 

341) 

342from flag_gems.ops.soft_margin_loss import soft_margin_loss, soft_margin_loss_out 

343from flag_gems.ops.softmax import ( 

344 softmax, 

345 softmax_backward, 

346 softmax_backward_out, 

347 softmax_out, 

348) 

349from flag_gems.ops.softplus import softplus 

350from flag_gems.ops.softshrink import softshrink, softshrink_out 

351from flag_gems.ops.sort import sort, sort_stable 

352from flag_gems.ops.special_i0e import special_i0e, special_i0e_out 

353from flag_gems.ops.special_i1 import special_i1, special_i1_out 

354from flag_gems.ops.sqrt import sqrt, sqrt_ 

355from flag_gems.ops.square import square, square_, square_out 

356from flag_gems.ops.stack import stack 

357from flag_gems.ops.std import std 

358from flag_gems.ops.sub import sub, sub_ 

359from flag_gems.ops.sum import sum, sum_dim, sum_dim_out, sum_out 

360from flag_gems.ops.svd import svd 

361from flag_gems.ops.t_copy import t_copy, t_copy_out 

362from flag_gems.ops.tan import tan, tan_ 

363from flag_gems.ops.tanh import tanh, tanh_, tanh_backward 

364from flag_gems.ops.threshold import threshold, threshold_backward 

365from flag_gems.ops.tile import tile 

366from flag_gems.ops.to import to_copy 

367from flag_gems.ops.topk import topk 

368from flag_gems.ops.trace import trace 

369from flag_gems.ops.tril import tril, tril_, tril_out 

370from flag_gems.ops.triu import triu, triu_ 

371from flag_gems.ops.unfold_backward import unfold_backward 

372from flag_gems.ops.uniform import uniform_ 

373from flag_gems.ops.unique import _unique2 

374from flag_gems.ops.unique_consecutive import unique_consecutive 

375from flag_gems.ops.upsample_bicubic2d import upsample_bicubic2d 

376from flag_gems.ops.upsample_bicubic2d_aa import _upsample_bicubic2d_aa 

377from flag_gems.ops.upsample_bicubic2d_aa_backward import _upsample_bicubic2d_aa_backward 

378from flag_gems.ops.upsample_linear1d import upsample_linear1d 

379from flag_gems.ops.upsample_nearest1d import upsample_nearest1d 

380from flag_gems.ops.upsample_nearest2d import upsample_nearest2d 

381from flag_gems.ops.upsample_nearest3d import upsample_nearest3d 

382from flag_gems.ops.var import var, var_correction, var_dim 

383from flag_gems.ops.var_mean import var_mean 

384from flag_gems.ops.vdot import vdot 

385from flag_gems.ops.vector_norm import vector_norm 

386from flag_gems.ops.vstack import vstack 

387from flag_gems.ops.w8a8_block_fp8_matmul import w8a8_block_fp8_matmul 

388from flag_gems.ops.weightnorm import ( 

389 weight_norm_interface, 

390 weight_norm_interface_backward, 

391) 

392from flag_gems.ops.where import ( 

393 where_scalar_other, 

394 where_scalar_self, 

395 where_self, 

396 where_self_out, 

397) 

398from flag_gems.ops.zero import zero, zero_out 

399from flag_gems.ops.zeros import zero_, zeros 

400from flag_gems.ops.zeros_like import zeros_like 

401 

402__all__ = [ 

403 "_assert_async", 

404 "_conv_depthwise2d", 

405 "_euclidean_dist", 

406 "_functional_sym_constrain_range_for_size", 

407 "_index_put_impl_", 

408 "_is_all_true", 

409 "_safe_softmax", 

410 "_unique2", 

411 "_upsample_bicubic2d_aa", 

412 "_upsample_bicubic2d_aa_backward", 

413 "_upsample_nearest_exact1d", 

414 "abs", 

415 "abs_", 

416 "absolute", 

417 "acos", 

418 "act_quant_triton", 

419 "add", 

420 "add_", 

421 "addcdiv", 

422 "addcdiv_out", 

423 "addcmul", 

424 "addcmul_out", 

425 "addmm", 

426 "addmm_dtype", 

427 "addmm_dtype_out", 

428 "addmm_out", 

429 "addmv", 

430 "addmv_out", 

431 "addr", 

432 "affine_grid_generator", 

433 "alias_copy", 

434 "alias_copy_out", 

435 "all", 

436 "all_dim", 

437 "all_dims", 

438 "allclose", 

439 "amax", 

440 "aminmax", 

441 "angle", 

442 "any", 

443 "any_dim", 

444 "any_dims", 

445 "arange", 

446 "arange_start", 

447 "arcsinh", 

448 "arcsinh_", 

449 "arcsinh_out", 

450 "arctanh_", 

451 "argmax", 

452 "argmin", 

453 "argsort", 

454 "as_strided_copy", 

455 "as_strided_copy_out", 

456 "asinh", 

457 "asinh_", 

458 "asinh_out", 

459 "atan", 

460 "atan2", 

461 "atan2_out", 

462 "atan_", 

463 "avg_pool2d", 

464 "avg_pool2d_backward", 

465 "avg_pool3d", 

466 "avg_pool3d_backward", 

467 "baddbmm", 

468 "baddbmm_out", 

469 "batch_norm", 

470 "batch_norm_backward", 

471 "bernoulli_", 

472 "bincount", 

473 "bitwise_and_scalar", 

474 "bitwise_and_scalar_", 

475 "bitwise_and_scalar_tensor", 

476 "bitwise_and_tensor", 

477 "bitwise_and_tensor_", 

478 "bitwise_left_shift", 

479 "bitwise_not", 

480 "bitwise_not_", 

481 "bitwise_or_scalar", 

482 "bitwise_or_scalar_", 

483 "bitwise_or_scalar_tensor", 

484 "bitwise_or_tensor", 

485 "bitwise_or_tensor_", 

486 "bitwise_right_shift", 

487 "bmm", 

488 "bmm_out", 

489 "cat", 

490 "cat_out", 

491 "cauchy", 

492 "cauchy_", 

493 "ceil", 

494 "ceil_", 

495 "ceil_out", 

496 "celu", 

497 "celu_", 

498 "clamp", 

499 "clamp_", 

500 "clamp_max", 

501 "clamp_max_", 

502 "clamp_min", 

503 "clamp_min_", 

504 "clamp_tensor", 

505 "clamp_tensor_", 

506 "clip", 

507 "clip_", 

508 "col2im", 

509 "concatenate", 

510 "conj_physical", 

511 "constant_pad_nd", 

512 "contiguous", 

513 "conv1d", 

514 "conv2d", 

515 "conv3d", 

516 "conv_transpose1d", 

517 "conv_transpose2d", 

518 "copy", 

519 "copy_", 

520 "copysign", 

521 "copysign_out", 

522 "cos", 

523 "cos_", 

524 "cosh", 

525 "cosh_", 

526 "cosh_out", 

527 "count_nonzero", 

528 "ctc_loss", 

529 "cudnn_convolution", 

530 "cummax", 

531 "cummin", 

532 "cumprod", 

533 "cumprod_", 

534 "cumsum", 

535 "cumsum_out", 

536 "diag", 

537 "diag_embed", 

538 "diagonal_backward", 

539 "diff", 

540 "digamma_", 

541 "div_mode", 

542 "div_mode_", 

543 "dot", 

544 "dropout", 

545 "dropout_backward", 

546 "elu", 

547 "elu_", 

548 "elu_backward", 

549 "embedding", 

550 "embedding_backward", 

551 "embedding_dense_backward", 

552 "eq", 

553 "eq_scalar", 

554 "equal", 

555 "erf", 

556 "erf_", 

557 "exp", 

558 "exp2", 

559 "exp2_", 

560 "exp_", 

561 "exp_out", 

562 "expm1", 

563 "expm1_", 

564 "expm1_out", 

565 "exponential_", 

566 "eye", 

567 "eye_m", 

568 "feature_dropout", 

569 "feature_dropout_", 

570 "fft", 

571 "fill_scalar", 

572 "fill_scalar_", 

573 "fill_scalar_out", 

574 "fill_tensor", 

575 "fill_tensor_", 

576 "fill_tensor_out", 

577 "flash_attention_forward", 

578 "flash_attn_varlen_func", 

579 "flash_attn_varlen_opt_func", 

580 "flip", 

581 "floor", 

582 "floor_", 

583 "floor_out", 

584 "floor_divide", 

585 "floor_divide_", 

586 "fmin", 

587 "fmin_out", 

588 "fmod_scalar", 

589 "fmod_scalar_", 

590 "fmod_tensor", 

591 "fmod_tensor_", 

592 "fp8_matmul", 

593 "fp8_mqa_logits", 

594 "full", 

595 "full_like", 

596 "gather", 

597 "gather_backward", 

598 "gcd", 

599 "gcd_out", 

600 "ge", 

601 "ge_scalar", 

602 "gelu", 

603 "gelu_", 

604 "gelu_backward", 

605 "get_paged_mqa_logits_metadata", 

606 "get_scheduler_metadata", 

607 "glu", 

608 "glu_backward", 

609 "greater", 

610 "greater_out", 

611 "greater_scalar", 

612 "greater_scalar_out", 

613 "grid_sample", 

614 "group_mm", 

615 "group_norm", 

616 "group_norm_backward", 

617 "gt", 

618 "gt_scalar", 

619 "hadamard_transform", 

620 "hadamard_transform_12N", 

621 "hadamard_transform_20N", 

622 "hadamard_transform_28N", 

623 "hadamard_transform_40N", 

624 "hardsigmoid", 

625 "hardsigmoid_out", 

626 "hardswish_", 

627 "histc", 

628 "hstack", 

629 "hypot", 

630 "hypot_out", 

631 "i0", 

632 "i0_", 

633 "i0_out", 

634 "index", 

635 "index_add", 

636 "index_add_", 

637 "index_copy", 

638 "index_copy_", 

639 "index_put", 

640 "index_put_", 

641 "index_select", 

642 "isclose", 

643 "isfinite", 

644 "isin", 

645 "isinf", 

646 "isnan", 

647 "isneginf", 

648 "isneginf_out", 

649 "kron", 

650 "layer_norm", 

651 "layer_norm_backward", 

652 "le", 

653 "le_scalar", 

654 "leaky_relu", 

655 "leaky_relu_", 

656 "leaky_relu_out", 

657 "lerp_scalar", 

658 "lerp_scalar_", 

659 "lerp_tensor", 

660 "lerp_tensor_", 

661 "lift_fresh_copy", 

662 "lift_fresh_copy_out", 

663 "linspace", 

664 "log", 

665 "log10", 

666 "log10_", 

667 "log10_out", 

668 "log1p_", 

669 "log_sigmoid", 

670 "log_softmax", 

671 "log_softmax_backward", 

672 "log_softmax_backward_out", 

673 "log_softmax_out", 

674 "log1p", 

675 "log1p_", 

676 "logaddexp", 

677 "logaddexp_out", 

678 "logical_and", 

679 "logical_and_", 

680 "logical_not", 

681 "logical_or", 

682 "logical_or_", 

683 "logical_xor", 

684 "logit", 

685 "logit_", 

686 "logit_out", 

687 "logspace", 

688 "logsumexp", 

689 "lt", 

690 "lt_scalar", 

691 "margin_ranking_loss", 

692 "masked_fill", 

693 "masked_fill_", 

694 "masked_scatter", 

695 "masked_scatter_", 

696 "masked_select", 

697 "max", 

698 "max_dim", 

699 "max_pool2d_backward", 

700 "max_pool2d_with_indices", 

701 "max_pool3d_backward", 

702 "max_pool3d_with_indices", 

703 "maximum", 

704 "mean", 

705 "mean_dim", 

706 "median", 

707 "median_dim", 

708 "median_dim_values", 

709 "median_out", 

710 "min", 

711 "min_dim", 

712 "minimum", 

713 "mm", 

714 "mm_out", 

715 "mse_loss", 

716 "mul", 

717 "mul_", 

718 "multinomial", 

719 "mv", 

720 "nan_to_num", 

721 "ne", 

722 "ne_scalar", 

723 "neg", 

724 "neg_", 

725 "new_full", 

726 "nll_loss2d_backward", 

727 "nll_loss2d_forward", 

728 "nll_loss_backward", 

729 "nll_loss_forward", 

730 "nll_loss_nd_backward", 

731 "nll_loss_nd_forward", 

732 "nonzero", 

733 "nonzero_numpy", 

734 "normal_", 

735 "normal_float_tensor", 

736 "normal_tensor_float", 

737 "normal_tensor_tensor", 

738 "normed_cumsum", 

739 "one_hot", 

740 "ones", 

741 "ones_like", 

742 "pad", 

743 "per_token_group_quant_fp8", 

744 "pixel_shuffle", 

745 "pixel_unshuffle", 

746 "pixel_unshuffle_out", 

747 "poisson", 

748 "polar", 

749 "pow_scalar", 

750 "pow_tensor_scalar", 

751 "pow_tensor_scalar_", 

752 "pow_tensor_tensor", 

753 "pow_tensor_tensor_", 

754 "prelu", 

755 "prod", 

756 "prod_dim", 

757 "quantile", 

758 "rad2deg", 

759 "rad2deg_", 

760 "rand", 

761 "rand_like", 

762 "randint", 

763 "randn", 

764 "randn_like", 

765 "randperm", 

766 "reciprocal", 

767 "reciprocal_", 

768 "reflection_pad1d", 

769 "reflection_pad1d_backward", 

770 "reflection_pad1d_out", 

771 "reflection_pad2d", 

772 "reflection_pad2d_out", 

773 "relu", 

774 "relu6", 

775 "relu_", 

776 "remainder", 

777 "remainder_", 

778 "repeat", 

779 "repeat_interleave_self_int", 

780 "repeat_interleave_self_tensor", 

781 "repeat_interleave_tensor", 

782 "replication_pad1d", 

783 "replication_pad1d_out", 

784 "replication_pad3d", 

785 "resolve_conj", 

786 "resolve_neg", 

787 "rms_norm", 

788 "rms_norm_backward", 

789 "rms_norm_forward", 

790 "roll", 

791 "round", 

792 "round_", 

793 "round_out", 

794 "router_gemm", 

795 "rrelu_with_noise_backward", 

796 "rsqrt", 

797 "rsqrt_", 

798 "rsub_scalar", 

799 "rsub_tensor", 

800 "scaled_dot_product_attention", 

801 "scaled_dot_product_attention_backward", 

802 "scaled_dot_product_attention_forward", 

803 "scaled_mm", 

804 "scaled_mm_out", 

805 "scaled_softmax_backward", 

806 "scaled_softmax_forward", 

807 "ScaleDotProductAttention", 

808 "scatter", 

809 "scatter_", 

810 "scatter_add_", 

811 "scatter_reduce", 

812 "scatter_reduce_", 

813 "scatter_reduce_out", 

814 "select_backward", 

815 "select_scatter", 

816 "selu", 

817 "selu_", 

818 "sgn_", 

819 "sigmoid", 

820 "sigmoid_", 

821 "sigmoid_backward", 

822 "signbit", 

823 "signbit_out", 

824 "silu", 

825 "silu_", 

826 "silu_backward", 

827 "sin", 

828 "sin_", 

829 "sinh_", 

830 "slice_backward", 

831 "slice_scatter", 

832 "smooth_l1_loss", 

833 "smooth_l1_loss_backward", 

834 "smooth_l1_loss_out", 

835 "soft_margin_loss", 

836 "soft_margin_loss_out", 

837 "softmax", 

838 "softmax_backward", 

839 "softmax_backward_out", 

840 "softmax_out", 

841 "softplus", 

842 "softshrink", 

843 "softshrink_out", 

844 "sort", 

845 "sort_stable", 

846 "special_i0e", 

847 "special_i0e_out", 

848 "special_i1", 

849 "special_i1_out", 

850 "sqrt", 

851 "sqrt_", 

852 "square", 

853 "square_", 

854 "square_out", 

855 "stack", 

856 "std", 

857 "sub", 

858 "sub_", 

859 "sum", 

860 "sum_dim", 

861 "sum_dim_out", 

862 "sum_out", 

863 "SUPPORTED_FP8_DTYPE", 

864 "svd", 

865 "t_copy", 

866 "t_copy_out", 

867 "tan", 

868 "tan_", 

869 "tanh", 

870 "tanh_", 

871 "tanh_backward", 

872 "threshold", 

873 "threshold_backward", 

874 "tile", 

875 "to_copy", 

876 "topk", 

877 "trace", 

878 "tril", 

879 "tril_", 

880 "tril_out", 

881 "triu", 

882 "triu_", 

883 "true_divide", 

884 "true_divide_", 

885 "true_divide_out", 

886 "unfold_backward", 

887 "uniform_", 

888 "unique_consecutive", 

889 "upsample_bicubic2d", 

890 "upsample_linear1d", 

891 "upsample_nearest1d", 

892 "upsample_nearest2d", 

893 "upsample_nearest3d", 

894 "var", 

895 "var_correction", 

896 "var_dim", 

897 "var_mean", 

898 "vdot", 

899 "vector_norm", 

900 "vstack", 

901 "w8a8_block_fp8_matmul", 

902 "weight_norm_interface", 

903 "weight_norm_interface_backward", 

904 "where_scalar_other", 

905 "where_scalar_self", 

906 "where_self", 

907 "where_self_out", 

908 "zero", 

909 "zero_", 

910 "zero_out", 

911 "zeros", 

912 "zeros_like", 

913]