Coverage for src/flag_gems/ops/__init__.py: 100%

306 statements  

« prev     ^ index     » next       coverage.py v7.6.9, created at 2026-06-10 07:09 +0800

1from flag_gems.ops._euclidean_dist import _euclidean_dist 

2from flag_gems.ops._functional_sym_constrain_range_for_size import ( 

3 _functional_sym_constrain_range_for_size, 

4) 

5from flag_gems.ops._is_all_true import _is_all_true 

6from flag_gems.ops._safe_softmax import _safe_softmax 

7from flag_gems.ops._upsample_nearest_exact1d import _upsample_nearest_exact1d 

8from flag_gems.ops.abs import abs, abs_ 

9from flag_gems.ops.absolute import absolute 

10from flag_gems.ops.acos import acos 

11from flag_gems.ops.act_quant import act_quant_triton 

12from flag_gems.ops.add import add, add_ 

13from flag_gems.ops.addcdiv import addcdiv, addcdiv_out 

14from flag_gems.ops.addcmul import addcmul, addcmul_out 

15from flag_gems.ops.addmm import addmm, addmm_dtype, addmm_dtype_out, addmm_out 

16from flag_gems.ops.addmv import addmv, addmv_out 

17from flag_gems.ops.addr import addr 

18from flag_gems.ops.affine_grid_generator import affine_grid_generator 

19from flag_gems.ops.alias_copy import alias_copy, alias_copy_out 

20from flag_gems.ops.all import all, all_dim, all_dims 

21from flag_gems.ops.amax import amax 

22from flag_gems.ops.aminmax import aminmax 

23from flag_gems.ops.angle import angle 

24from flag_gems.ops.any import any, any_dim, any_dims 

25from flag_gems.ops.arange import arange, arange_start 

26from flag_gems.ops.arcsinh import arcsinh, arcsinh_out 

27from flag_gems.ops.arcsinh_ import arcsinh_ 

28from flag_gems.ops.arctanh_ import arctanh_ 

29from flag_gems.ops.argmax import argmax 

30from flag_gems.ops.argmin import argmin 

31from flag_gems.ops.argsort import argsort 

32from flag_gems.ops.as_strided_copy import as_strided_copy, as_strided_copy_out 

33from flag_gems.ops.asinh import asinh, asinh_out 

34from flag_gems.ops.asinh_ import asinh_ 

35from flag_gems.ops.assert_async import _assert_async 

36from flag_gems.ops.atan import atan, atan_ 

37from flag_gems.ops.atan2 import atan2, atan2_out 

38from flag_gems.ops.atanh import atanh, atanh_ 

39from flag_gems.ops.attention import ( 

40 ScaleDotProductAttention, 

41 flash_attention_forward, 

42 flash_attn_varlen_func, 

43 flash_attn_varlen_opt_func, 

44 scaled_dot_product_attention, 

45 scaled_dot_product_attention_backward, 

46 scaled_dot_product_attention_forward, 

47) 

48from flag_gems.ops.avg_pool2d import avg_pool2d, avg_pool2d_backward 

49from flag_gems.ops.avg_pool3d import avg_pool3d, avg_pool3d_backward 

50from flag_gems.ops.baddbmm import baddbmm, baddbmm_out 

51from flag_gems.ops.batch_norm import batch_norm, batch_norm_backward 

52from flag_gems.ops.bernoulli_ import bernoulli_ 

53from flag_gems.ops.bincount import bincount 

54from flag_gems.ops.bitwise_and import ( 

55 bitwise_and_scalar, 

56 bitwise_and_scalar_, 

57 bitwise_and_scalar_tensor, 

58 bitwise_and_tensor, 

59 bitwise_and_tensor_, 

60) 

61from flag_gems.ops.bitwise_left_shift import bitwise_left_shift 

62from flag_gems.ops.bitwise_not import bitwise_not, bitwise_not_ 

63from flag_gems.ops.bitwise_or import ( 

64 bitwise_or_scalar, 

65 bitwise_or_scalar_, 

66 bitwise_or_scalar_tensor, 

67 bitwise_or_tensor, 

68 bitwise_or_tensor_, 

69) 

70from flag_gems.ops.bitwise_right_shift import bitwise_right_shift 

71from flag_gems.ops.bmm import bmm, bmm_out 

72from flag_gems.ops.cat import cat, cat_out 

73from flag_gems.ops.cauchy import cauchy, cauchy_ 

74from flag_gems.ops.ceil import ceil, ceil_, ceil_out 

75from flag_gems.ops.celu import celu, celu_ 

76from flag_gems.ops.clamp import ( 

77 clamp, 

78 clamp_, 

79 clamp_min, 

80 clamp_min_, 

81 clamp_tensor, 

82 clamp_tensor_, 

83) 

84from flag_gems.ops.clamp_max import clamp_max, clamp_max_ # noqa: F401 

85from flag_gems.ops.clip import clip, clip_ 

86from flag_gems.ops.col2im import col2im 

87from flag_gems.ops.concatenate import concatenate 

88from flag_gems.ops.conj_physical import conj_physical 

89from flag_gems.ops.contiguous import contiguous 

90from flag_gems.ops.conv1d import conv1d 

91from flag_gems.ops.conv2d import conv2d 

92from flag_gems.ops.conv3d import conv3d 

93from flag_gems.ops.conv_depthwise2d import _conv_depthwise2d 

94from flag_gems.ops.conv_transpose1d import conv_transpose1d 

95from flag_gems.ops.conv_transpose2d import conv_transpose2d 

96from flag_gems.ops.copy import copy, copy_ 

97from flag_gems.ops.copysign import copysign, copysign_out 

98from flag_gems.ops.cos import cos, cos_ 

99from flag_gems.ops.cosh import cosh, cosh_, cosh_out 

100from flag_gems.ops.count_nonzero import count_nonzero 

101from flag_gems.ops.ctc_loss import ctc_loss 

102from flag_gems.ops.cudnn_convolution import cudnn_convolution 

103from flag_gems.ops.cummax import cummax 

104from flag_gems.ops.cummin import cummin 

105from flag_gems.ops.cumprod import cumprod, cumprod_ 

106from flag_gems.ops.cumsum import cumsum, cumsum_out, normed_cumsum 

107from flag_gems.ops.diag import diag 

108from flag_gems.ops.diag_embed import diag_embed 

109from flag_gems.ops.diagonal import diagonal_backward 

110from flag_gems.ops.diff import diff 

111from flag_gems.ops.digamma_ import digamma_ 

112from flag_gems.ops.div import ( 

113 div_mode, 

114 div_mode_, 

115 floor_divide, 

116 floor_divide_, 

117 true_divide, 

118 true_divide_, 

119 true_divide_out, 

120) 

121from flag_gems.ops.dot import dot 

122from flag_gems.ops.dropout import dropout, dropout_backward 

123from flag_gems.ops.elu import elu, elu_, elu_backward 

124from flag_gems.ops.embedding import embedding, embedding_backward 

125from flag_gems.ops.embedding_dense_backward import embedding_dense_backward 

126from flag_gems.ops.eq import eq, eq_scalar, equal 

127from flag_gems.ops.erf import erf, erf_ 

128from flag_gems.ops.exp import exp, exp_, exp_out 

129from flag_gems.ops.exp2 import exp2, exp2_ 

130from flag_gems.ops.expm1 import expm1, expm1_, expm1_out 

131from flag_gems.ops.exponential_ import exponential_ 

132from flag_gems.ops.eye import eye 

133from flag_gems.ops.eye_m import eye_m 

134from flag_gems.ops.feature_dropout import feature_dropout, feature_dropout_ 

135from flag_gems.ops.fft import fft 

136from flag_gems.ops.fill import ( 

137 fill_scalar, 

138 fill_scalar_, 

139 fill_scalar_out, 

140 fill_tensor, 

141 fill_tensor_, 

142 fill_tensor_out, 

143) 

144from flag_gems.ops.flip import flip 

145from flag_gems.ops.floor import floor, floor_out 

146from flag_gems.ops.floor_ import floor_ 

147from flag_gems.ops.fmin import fmin, fmin_out 

148from flag_gems.ops.fmod import fmod_scalar, fmod_scalar_, fmod_tensor, fmod_tensor_ 

149from flag_gems.ops.fmod_ import fmod_ 

150from flag_gems.ops.fp8_matmul import fp8_matmul 

151from flag_gems.ops.fp8_mqa_logits import fp8_mqa_logits 

152from flag_gems.ops.full import full 

153from flag_gems.ops.full_like import full_like 

154from flag_gems.ops.gather import gather, gather_backward 

155from flag_gems.ops.gcd import gcd, gcd_out 

156from flag_gems.ops.ge import ge, ge_scalar 

157from flag_gems.ops.gelu import gelu, gelu_, gelu_backward 

158from flag_gems.ops.get_paged_mqa_logits_metadata import get_paged_mqa_logits_metadata 

159from flag_gems.ops.get_scheduler_metadata import get_scheduler_metadata 

160from flag_gems.ops.glu import glu, glu_backward 

161from flag_gems.ops.greater import ( 

162 greater, 

163 greater_out, 

164 greater_scalar, 

165 greater_scalar_out, 

166) 

167from flag_gems.ops.grid_sample import grid_sample 

168from flag_gems.ops.group_gemm import group_mm 

169from flag_gems.ops.groupnorm import group_norm, group_norm_backward 

170from flag_gems.ops.gt import gt, gt_scalar 

171from flag_gems.ops.hadamard_transform import ( 

172 hadamard_transform, 

173 hadamard_transform_12N, 

174 hadamard_transform_20N, 

175 hadamard_transform_28N, 

176 hadamard_transform_40N, 

177) 

178from flag_gems.ops.hardsigmoid import hardsigmoid, hardsigmoid_out 

179from flag_gems.ops.hardswish_ import hardswish_ 

180from flag_gems.ops.histc import histc 

181from flag_gems.ops.hstack import hstack 

182from flag_gems.ops.hypot import hypot, hypot_out 

183from flag_gems.ops.i0 import i0, i0_out 

184from flag_gems.ops.i0_ import i0_ 

185from flag_gems.ops.index import index 

186from flag_gems.ops.index_add import index_add, index_add_ 

187from flag_gems.ops.index_copy_ import index_copy, index_copy_ 

188from flag_gems.ops.index_put import _index_put_impl_, index_put, index_put_ 

189from flag_gems.ops.index_reduce import index_reduce_ 

190from flag_gems.ops.index_select import index_select 

191from flag_gems.ops.isclose import allclose, isclose 

192from flag_gems.ops.isfinite import isfinite 

193from flag_gems.ops.isin import isin 

194from flag_gems.ops.isinf import isinf 

195from flag_gems.ops.isnan import isnan 

196from flag_gems.ops.isneginf import isneginf, isneginf_out 

197from flag_gems.ops.kron import kron 

198from flag_gems.ops.layernorm import layer_norm, layer_norm_backward 

199from flag_gems.ops.le import le, le_scalar 

200from flag_gems.ops.leaky_relu import leaky_relu, leaky_relu_, leaky_relu_out 

201from flag_gems.ops.lerp import lerp_scalar, lerp_scalar_, lerp_tensor, lerp_tensor_ 

202from flag_gems.ops.lift_fresh_copy import lift_fresh_copy, lift_fresh_copy_out 

203from flag_gems.ops.linspace import linspace 

204from flag_gems.ops.log import log 

205from flag_gems.ops.log1p import log1p, log1p_out 

206from flag_gems.ops.log1p_ import log1p_ 

207from flag_gems.ops.log10 import log10, log10_, log10_out 

208from flag_gems.ops.log_sigmoid import log_sigmoid 

209from flag_gems.ops.log_softmax import ( 

210 log_softmax, 

211 log_softmax_backward, 

212 log_softmax_backward_out, 

213 log_softmax_out, 

214) 

215from flag_gems.ops.logaddexp import logaddexp, logaddexp_out 

216from flag_gems.ops.logical_and import logical_and, logical_and_ 

217from flag_gems.ops.logical_not import logical_not 

218from flag_gems.ops.logical_or import logical_or, logical_or_ 

219from flag_gems.ops.logical_xor import logical_xor 

220from flag_gems.ops.logit import logit, logit_out 

221from flag_gems.ops.logit_ import logit_ 

222from flag_gems.ops.logspace import logspace 

223from flag_gems.ops.logsumexp import logsumexp 

224from flag_gems.ops.lt import lt, lt_scalar 

225from flag_gems.ops.margin_ranking_loss import margin_ranking_loss 

226from flag_gems.ops.masked_fill import masked_fill, masked_fill_ 

227from flag_gems.ops.masked_scatter import masked_scatter, masked_scatter_ 

228from flag_gems.ops.masked_select import masked_select 

229from flag_gems.ops.max import max, max_dim 

230from flag_gems.ops.max_pool2d_with_indices import ( 

231 max_pool2d_backward, 

232 max_pool2d_with_indices, 

233) 

234from flag_gems.ops.max_pool3d_with_indices import ( 

235 max_pool3d_backward, 

236 max_pool3d_with_indices, 

237) 

238from flag_gems.ops.maximum import maximum 

239from flag_gems.ops.mean import mean, mean_dim 

240from flag_gems.ops.median import median, median_dim, median_dim_values, median_out 

241from flag_gems.ops.min import min, min_dim 

242from flag_gems.ops.minimum import minimum 

243from flag_gems.ops.mm import mm, mm_out, router_gemm 

244from flag_gems.ops.mse_loss import mse_loss 

245from flag_gems.ops.mul import mul, mul_ 

246from flag_gems.ops.multinomial import multinomial 

247from flag_gems.ops.mv import mv 

248from flag_gems.ops.nan_to_num import nan_to_num 

249from flag_gems.ops.nanmedian import ( 

250 nanmedian, 

251 nanmedian_dim, 

252 nanmedian_dim_values, 

253 nanmedian_out, 

254) 

255from flag_gems.ops.ne import ne, ne_scalar 

256from flag_gems.ops.neg import neg, neg_ 

257from flag_gems.ops.new_full import new_full 

258from flag_gems.ops.nll_loss_nd import nll_loss_nd_backward, nll_loss_nd_forward 

259from flag_gems.ops.nllloss import ( 

260 nll_loss2d_backward, 

261 nll_loss2d_forward, 

262 nll_loss_backward, 

263 nll_loss_forward, 

264) 

265from flag_gems.ops.nonzero import nonzero 

266from flag_gems.ops.nonzero_numpy import nonzero_numpy 

267from flag_gems.ops.normal import ( 

268 normal_, 

269 normal_float_tensor, 

270 normal_tensor_float, 

271 normal_tensor_tensor, 

272) 

273from flag_gems.ops.one_hot import one_hot 

274from flag_gems.ops.ones import ones 

275from flag_gems.ops.ones_like import ones_like 

276from flag_gems.ops.pad import constant_pad_nd, pad 

277from flag_gems.ops.per_token_group_quant_fp8 import ( 

278 SUPPORTED_FP8_DTYPE, 

279 per_token_group_quant_fp8, 

280) 

281from flag_gems.ops.pixel_shuffle import pixel_shuffle 

282from flag_gems.ops.pixel_unshuffle import pixel_unshuffle, pixel_unshuffle_out 

283from flag_gems.ops.poisson import poisson 

284from flag_gems.ops.polar import polar 

285from flag_gems.ops.pow import ( 

286 pow_scalar, 

287 pow_tensor_scalar, 

288 pow_tensor_scalar_, 

289 pow_tensor_tensor, 

290 pow_tensor_tensor_, 

291) 

292from flag_gems.ops.prelu import prelu 

293from flag_gems.ops.prod import prod, prod_dim 

294from flag_gems.ops.quantile import quantile 

295from flag_gems.ops.rad2deg import rad2deg, rad2deg_ 

296from flag_gems.ops.rand import rand 

297from flag_gems.ops.rand_like import rand_like 

298from flag_gems.ops.randint import randint 

299from flag_gems.ops.randint_like import randint_like 

300from flag_gems.ops.randn import randn 

301from flag_gems.ops.randn_like import randn_like 

302from flag_gems.ops.randperm import randperm 

303from flag_gems.ops.reciprocal import reciprocal, reciprocal_ 

304from flag_gems.ops.reflection_pad1d import reflection_pad1d, reflection_pad1d_out 

305from flag_gems.ops.reflection_pad1d_backward import reflection_pad1d_backward 

306from flag_gems.ops.reflection_pad2d import reflection_pad2d, reflection_pad2d_out 

307from flag_gems.ops.relu import relu, relu_ 

308from flag_gems.ops.relu6 import relu6 

309from flag_gems.ops.remainder import remainder, remainder_ 

310from flag_gems.ops.renorm import renorm, renorm_ 

311from flag_gems.ops.repeat import repeat 

312from flag_gems.ops.repeat_interleave import ( 

313 repeat_interleave_self_int, 

314 repeat_interleave_self_tensor, 

315 repeat_interleave_tensor, 

316) 

317from flag_gems.ops.replication_pad1d import replication_pad1d, replication_pad1d_out 

318from flag_gems.ops.replication_pad3d import replication_pad3d 

319from flag_gems.ops.resolve_conj import resolve_conj 

320from flag_gems.ops.resolve_neg import resolve_neg 

321from flag_gems.ops.rms_norm import rms_norm, rms_norm_backward, rms_norm_forward 

322from flag_gems.ops.roll import roll 

323from flag_gems.ops.rot90 import rot90 

324from flag_gems.ops.round import round, round_, round_out 

325from flag_gems.ops.rrelu_with_noise_backward import rrelu_with_noise_backward 

326from flag_gems.ops.rsqrt import rsqrt, rsqrt_ 

327from flag_gems.ops.rsub import rsub_scalar, rsub_tensor 

328from flag_gems.ops.scaled_mm import scaled_mm, scaled_mm_out 

329from flag_gems.ops.scaled_softmax import scaled_softmax_backward, scaled_softmax_forward 

330from flag_gems.ops.scatter import scatter, scatter_ 

331from flag_gems.ops.scatter_add_ import scatter_add_ 

332from flag_gems.ops.scatter_reduce import ( 

333 scatter_reduce, 

334 scatter_reduce_, 

335 scatter_reduce_out, 

336) 

337from flag_gems.ops.searchsorted import ( 

338 searchsorted, 

339 searchsorted_out, 

340 searchsorted_scalar, 

341 searchsorted_scalar_out, 

342) 

343from flag_gems.ops.segment_reduce import ( 

344 _segment_reduce_backward, 

345 _segment_reduce_backward_out, 

346 segment_reduce, 

347 segment_reduce_out, 

348) 

349from flag_gems.ops.select_backward import select_backward 

350from flag_gems.ops.select_scatter import select_scatter 

351from flag_gems.ops.selu import selu 

352from flag_gems.ops.selu_ import selu_ 

353from flag_gems.ops.sgn_ import sgn_ 

354from flag_gems.ops.sigmoid import sigmoid, sigmoid_, sigmoid_backward 

355from flag_gems.ops.signbit import signbit, signbit_out 

356from flag_gems.ops.silu import silu, silu_, silu_backward 

357from flag_gems.ops.sin import sin, sin_ 

358from flag_gems.ops.sinh_ import sinh_ 

359from flag_gems.ops.slice_backward import slice_backward 

360from flag_gems.ops.slice_scatter import slice_scatter 

361from flag_gems.ops.smooth_l1_loss import ( 

362 smooth_l1_loss, 

363 smooth_l1_loss_backward, 

364 smooth_l1_loss_out, 

365) 

366from flag_gems.ops.soft_margin_loss import soft_margin_loss, soft_margin_loss_out 

367from flag_gems.ops.softmax import ( 

368 softmax, 

369 softmax_backward, 

370 softmax_backward_out, 

371 softmax_out, 

372) 

373from flag_gems.ops.softplus import softplus 

374from flag_gems.ops.softshrink import softshrink, softshrink_out 

375from flag_gems.ops.sort import sort, sort_stable 

376from flag_gems.ops.special_i0e import special_i0e, special_i0e_out 

377from flag_gems.ops.special_i1 import special_i1, special_i1_out 

378from flag_gems.ops.split_with_sizes_copy import split_with_sizes_copy 

379from flag_gems.ops.sqrt import sqrt, sqrt_ 

380from flag_gems.ops.square import square, square_, square_out 

381from flag_gems.ops.stack import stack 

382from flag_gems.ops.std import std 

383from flag_gems.ops.sub import sub, sub_ 

384from flag_gems.ops.sum import sum, sum_dim, sum_dim_out, sum_out 

385from flag_gems.ops.svd import svd 

386from flag_gems.ops.t_copy import t_copy, t_copy_out 

387from flag_gems.ops.tan import tan, tan_ 

388from flag_gems.ops.tanh import tanh, tanh_, tanh_backward 

389from flag_gems.ops.tensor_split import tensor_split 

390from flag_gems.ops.threshold import threshold, threshold_backward 

391from flag_gems.ops.tile import tile 

392from flag_gems.ops.to import to_copy 

393from flag_gems.ops.topk import topk 

394from flag_gems.ops.trace import trace 

395from flag_gems.ops.tril import tril, tril_, tril_out 

396from flag_gems.ops.triu import triu, triu_ 

397from flag_gems.ops.unfold_backward import unfold_backward 

398from flag_gems.ops.uniform import uniform_ 

399from flag_gems.ops.unique import _unique2 

400from flag_gems.ops.unique_consecutive import unique_consecutive 

401from flag_gems.ops.unique_dim import unique_dim 

402from flag_gems.ops.upsample_bicubic2d import upsample_bicubic2d 

403from flag_gems.ops.upsample_bicubic2d_aa import _upsample_bicubic2d_aa 

404from flag_gems.ops.upsample_bicubic2d_aa_backward import _upsample_bicubic2d_aa_backward 

405from flag_gems.ops.upsample_linear1d import upsample_linear1d 

406from flag_gems.ops.upsample_linear1d_backward import upsample_linear1d_backward 

407from flag_gems.ops.upsample_nearest1d import upsample_nearest1d 

408from flag_gems.ops.upsample_nearest2d import upsample_nearest2d 

409from flag_gems.ops.upsample_nearest3d import upsample_nearest3d 

410from flag_gems.ops.upsample_trilinear3d import upsample_trilinear3d 

411from flag_gems.ops.var import var, var_correction, var_dim 

412from flag_gems.ops.var_mean import var_mean 

413from flag_gems.ops.vdot import vdot 

414from flag_gems.ops.vector_norm import vector_norm 

415from flag_gems.ops.view_copy import view_copy 

416from flag_gems.ops.vstack import vstack 

417from flag_gems.ops.w8a8_block_fp8_matmul import w8a8_block_fp8_matmul 

418from flag_gems.ops.weightnorm import ( 

419 weight_norm_interface, 

420 weight_norm_interface_backward, 

421) 

422from flag_gems.ops.where import ( 

423 where_scalar_other, 

424 where_scalar_self, 

425 where_self, 

426 where_self_out, 

427) 

428from flag_gems.ops.zero import zero, zero_out 

429from flag_gems.ops.zeros import zero_, zeros 

430from flag_gems.ops.zeros_like import zeros_like 

431 

432__all__ = [ 

433 "SUPPORTED_FP8_DTYPE", 

434 "ScaleDotProductAttention", 

435 "_assert_async", 

436 "_conv_depthwise2d", 

437 "_euclidean_dist", 

438 "_functional_sym_constrain_range_for_size", 

439 "_index_put_impl_", 

440 "_is_all_true", 

441 "_safe_softmax", 

442 "_segment_reduce_backward", 

443 "_segment_reduce_backward_out", 

444 "_unique2", 

445 "_upsample_bicubic2d_aa", 

446 "_upsample_bicubic2d_aa_backward", 

447 "_upsample_nearest_exact1d", 

448 "abs", 

449 "abs_", 

450 "absolute", 

451 "acos", 

452 "act_quant_triton", 

453 "add", 

454 "add_", 

455 "addcdiv", 

456 "addcdiv_out", 

457 "addcmul", 

458 "addcmul_out", 

459 "addmm", 

460 "addmm_dtype", 

461 "addmm_dtype_out", 

462 "addmm_out", 

463 "addmv", 

464 "addmv_out", 

465 "addr", 

466 "affine_grid_generator", 

467 "alias_copy", 

468 "alias_copy_out", 

469 "all", 

470 "all_dim", 

471 "all_dims", 

472 "allclose", 

473 "amax", 

474 "aminmax", 

475 "angle", 

476 "any", 

477 "any_dim", 

478 "any_dims", 

479 "arange", 

480 "arange_start", 

481 "arcsinh", 

482 "arcsinh_", 

483 "arcsinh_out", 

484 "arctanh_", 

485 "argmax", 

486 "argmin", 

487 "argsort", 

488 "as_strided_copy", 

489 "as_strided_copy_out", 

490 "asinh", 

491 "asinh_", 

492 "asinh_out", 

493 "atan", 

494 "atan2", 

495 "atan2_out", 

496 "atan_", 

497 "atanh", 

498 "atanh_", 

499 "avg_pool2d", 

500 "avg_pool2d_backward", 

501 "avg_pool3d", 

502 "avg_pool3d_backward", 

503 "baddbmm", 

504 "baddbmm_out", 

505 "batch_norm", 

506 "batch_norm_backward", 

507 "bernoulli_", 

508 "bincount", 

509 "bitwise_and_scalar", 

510 "bitwise_and_scalar_", 

511 "bitwise_and_scalar_tensor", 

512 "bitwise_and_tensor", 

513 "bitwise_and_tensor_", 

514 "bitwise_left_shift", 

515 "bitwise_not", 

516 "bitwise_not_", 

517 "bitwise_or_scalar", 

518 "bitwise_or_scalar_", 

519 "bitwise_or_scalar_tensor", 

520 "bitwise_or_tensor", 

521 "bitwise_or_tensor_", 

522 "bitwise_right_shift", 

523 "bmm", 

524 "bmm_out", 

525 "cat", 

526 "cat_out", 

527 "cauchy", 

528 "cauchy_", 

529 "ceil", 

530 "ceil_", 

531 "ceil_out", 

532 "celu", 

533 "celu_", 

534 "clamp", 

535 "clamp_", 

536 "clamp_max", 

537 "clamp_max_", 

538 "clamp_min", 

539 "clamp_min_", 

540 "clamp_tensor", 

541 "clamp_tensor_", 

542 "clip", 

543 "clip_", 

544 "col2im", 

545 "concatenate", 

546 "conj_physical", 

547 "constant_pad_nd", 

548 "contiguous", 

549 "conv1d", 

550 "conv2d", 

551 "conv3d", 

552 "conv_transpose1d", 

553 "conv_transpose2d", 

554 "copy", 

555 "copy_", 

556 "copysign", 

557 "copysign_out", 

558 "cos", 

559 "cos_", 

560 "cosh", 

561 "cosh_", 

562 "cosh_out", 

563 "count_nonzero", 

564 "ctc_loss", 

565 "cudnn_convolution", 

566 "cummax", 

567 "cummin", 

568 "cumprod", 

569 "cumprod_", 

570 "cumsum", 

571 "cumsum_out", 

572 "diag", 

573 "diag_embed", 

574 "diagonal_backward", 

575 "diff", 

576 "digamma_", 

577 "div_mode", 

578 "div_mode_", 

579 "dot", 

580 "dropout", 

581 "dropout_backward", 

582 "elu", 

583 "elu_", 

584 "elu_backward", 

585 "embedding", 

586 "embedding_backward", 

587 "embedding_dense_backward", 

588 "eq", 

589 "eq_scalar", 

590 "equal", 

591 "erf", 

592 "erf_", 

593 "exp", 

594 "exp2", 

595 "exp2_", 

596 "exp_", 

597 "exp_out", 

598 "expm1", 

599 "expm1_", 

600 "expm1_out", 

601 "exponential_", 

602 "eye", 

603 "eye_m", 

604 "feature_dropout", 

605 "feature_dropout_", 

606 "fft", 

607 "fill_scalar", 

608 "fill_scalar_", 

609 "fill_scalar_out", 

610 "fill_tensor", 

611 "fill_tensor_", 

612 "fill_tensor_out", 

613 "flash_attention_forward", 

614 "flash_attn_varlen_func", 

615 "flash_attn_varlen_opt_func", 

616 "flip", 

617 "floor", 

618 "floor_", 

619 "floor_divide", 

620 "floor_divide_", 

621 "floor_out", 

622 "fmin", 

623 "fmin_out", 

624 "fmod_", 

625 "fmod_scalar", 

626 "fmod_scalar_", 

627 "fmod_tensor", 

628 "fmod_tensor_", 

629 "fp8_matmul", 

630 "fp8_mqa_logits", 

631 "full", 

632 "full_like", 

633 "gather", 

634 "gather_backward", 

635 "gcd", 

636 "gcd_out", 

637 "ge", 

638 "ge_scalar", 

639 "gelu", 

640 "gelu_", 

641 "gelu_backward", 

642 "get_paged_mqa_logits_metadata", 

643 "get_scheduler_metadata", 

644 "glu", 

645 "glu_backward", 

646 "greater", 

647 "greater_out", 

648 "greater_scalar", 

649 "greater_scalar_out", 

650 "grid_sample", 

651 "group_mm", 

652 "group_norm", 

653 "group_norm_backward", 

654 "gt", 

655 "gt_scalar", 

656 "hadamard_transform", 

657 "hadamard_transform_12N", 

658 "hadamard_transform_20N", 

659 "hadamard_transform_28N", 

660 "hadamard_transform_40N", 

661 "hardsigmoid", 

662 "hardsigmoid_out", 

663 "hardswish_", 

664 "histc", 

665 "hstack", 

666 "hypot", 

667 "hypot_out", 

668 "i0", 

669 "i0_", 

670 "i0_out", 

671 "index", 

672 "index_add", 

673 "index_add_", 

674 "index_copy", 

675 "index_copy_", 

676 "index_put", 

677 "index_put_", 

678 "index_reduce_", 

679 "index_select", 

680 "isclose", 

681 "isfinite", 

682 "isin", 

683 "isinf", 

684 "isnan", 

685 "isneginf", 

686 "isneginf_out", 

687 "kron", 

688 "layer_norm", 

689 "layer_norm_backward", 

690 "le", 

691 "le_scalar", 

692 "leaky_relu", 

693 "leaky_relu_", 

694 "leaky_relu_out", 

695 "lerp_scalar", 

696 "lerp_scalar_", 

697 "lerp_tensor", 

698 "lerp_tensor_", 

699 "lift_fresh_copy", 

700 "lift_fresh_copy_out", 

701 "linspace", 

702 "log", 

703 "log10", 

704 "log10_", 

705 "log10_out", 

706 "log1p", 

707 "log1p_", 

708 "log1p_out", 

709 "log_sigmoid", 

710 "log_softmax", 

711 "log_softmax_backward", 

712 "log_softmax_backward_out", 

713 "log_softmax_out", 

714 "logaddexp", 

715 "logaddexp_out", 

716 "logical_and", 

717 "logical_and_", 

718 "logical_not", 

719 "logical_or", 

720 "logical_or_", 

721 "logical_xor", 

722 "logit", 

723 "logit_", 

724 "logit_out", 

725 "logspace", 

726 "logsumexp", 

727 "lt", 

728 "lt_scalar", 

729 "margin_ranking_loss", 

730 "masked_fill", 

731 "masked_fill_", 

732 "masked_scatter", 

733 "masked_scatter_", 

734 "masked_select", 

735 "max", 

736 "max_dim", 

737 "max_pool2d_backward", 

738 "max_pool2d_with_indices", 

739 "max_pool3d_backward", 

740 "max_pool3d_with_indices", 

741 "maximum", 

742 "mean", 

743 "mean_dim", 

744 "median", 

745 "median_dim", 

746 "median_dim_values", 

747 "median_out", 

748 "min", 

749 "min_dim", 

750 "minimum", 

751 "mm", 

752 "mm_out", 

753 "mse_loss", 

754 "mul", 

755 "mul_", 

756 "multinomial", 

757 "mv", 

758 "nan_to_num", 

759 "nanmedian", 

760 "nanmedian_dim", 

761 "nanmedian_dim_values", 

762 "nanmedian_out", 

763 "ne", 

764 "ne_scalar", 

765 "neg", 

766 "neg_", 

767 "new_full", 

768 "nll_loss2d_backward", 

769 "nll_loss2d_forward", 

770 "nll_loss_backward", 

771 "nll_loss_forward", 

772 "nll_loss_nd_backward", 

773 "nll_loss_nd_forward", 

774 "nonzero", 

775 "nonzero_numpy", 

776 "normal_", 

777 "normal_float_tensor", 

778 "normal_tensor_float", 

779 "normal_tensor_tensor", 

780 "normed_cumsum", 

781 "one_hot", 

782 "ones", 

783 "ones_like", 

784 "pad", 

785 "per_token_group_quant_fp8", 

786 "pixel_shuffle", 

787 "pixel_unshuffle", 

788 "pixel_unshuffle_out", 

789 "poisson", 

790 "polar", 

791 "pow_scalar", 

792 "pow_tensor_scalar", 

793 "pow_tensor_scalar_", 

794 "pow_tensor_tensor", 

795 "pow_tensor_tensor_", 

796 "prelu", 

797 "prod", 

798 "prod_dim", 

799 "quantile", 

800 "rad2deg", 

801 "rad2deg_", 

802 "rand", 

803 "rand_like", 

804 "randint", 

805 "randint_like", 

806 "randn", 

807 "randn_like", 

808 "randperm", 

809 "reciprocal", 

810 "reciprocal_", 

811 "reflection_pad1d", 

812 "reflection_pad1d_backward", 

813 "reflection_pad1d_out", 

814 "reflection_pad2d", 

815 "reflection_pad2d_out", 

816 "relu", 

817 "relu6", 

818 "relu_", 

819 "remainder", 

820 "remainder_", 

821 "renorm", 

822 "renorm_", 

823 "repeat", 

824 "repeat_interleave_self_int", 

825 "repeat_interleave_self_tensor", 

826 "repeat_interleave_tensor", 

827 "replication_pad1d", 

828 "replication_pad1d_out", 

829 "replication_pad3d", 

830 "resolve_conj", 

831 "resolve_neg", 

832 "rms_norm", 

833 "rms_norm_backward", 

834 "rms_norm_forward", 

835 "roll", 

836 "rot90", 

837 "round", 

838 "round_", 

839 "round_out", 

840 "router_gemm", 

841 "rrelu_with_noise_backward", 

842 "rsqrt", 

843 "rsqrt_", 

844 "rsub_scalar", 

845 "rsub_tensor", 

846 "scaled_dot_product_attention", 

847 "scaled_dot_product_attention_backward", 

848 "scaled_dot_product_attention_forward", 

849 "scaled_mm", 

850 "scaled_mm_out", 

851 "scaled_softmax_backward", 

852 "scaled_softmax_forward", 

853 "scatter", 

854 "scatter_", 

855 "scatter_add_", 

856 "scatter_reduce", 

857 "scatter_reduce_", 

858 "scatter_reduce_out", 

859 "searchsorted", 

860 "searchsorted_out", 

861 "searchsorted_scalar", 

862 "searchsorted_scalar_out", 

863 "segment_reduce", 

864 "segment_reduce_out", 

865 "select_backward", 

866 "select_scatter", 

867 "selu", 

868 "selu_", 

869 "sgn_", 

870 "sigmoid", 

871 "sigmoid_", 

872 "sigmoid_backward", 

873 "signbit", 

874 "signbit_out", 

875 "silu", 

876 "silu_", 

877 "silu_backward", 

878 "sin", 

879 "sin_", 

880 "sinh_", 

881 "slice_backward", 

882 "slice_scatter", 

883 "smooth_l1_loss", 

884 "smooth_l1_loss_backward", 

885 "smooth_l1_loss_out", 

886 "soft_margin_loss", 

887 "soft_margin_loss_out", 

888 "softmax", 

889 "softmax_backward", 

890 "softmax_backward_out", 

891 "softmax_out", 

892 "softplus", 

893 "softshrink", 

894 "softshrink_out", 

895 "sort", 

896 "sort_stable", 

897 "special_i0e", 

898 "special_i0e_out", 

899 "special_i1", 

900 "special_i1_out", 

901 "split_with_sizes_copy", 

902 "sqrt", 

903 "sqrt_", 

904 "square", 

905 "square_", 

906 "square_out", 

907 "stack", 

908 "std", 

909 "sub", 

910 "sub_", 

911 "sum", 

912 "sum_dim", 

913 "sum_dim_out", 

914 "sum_out", 

915 "svd", 

916 "t_copy", 

917 "t_copy_out", 

918 "tan", 

919 "tan_", 

920 "tanh", 

921 "tanh_", 

922 "tanh_backward", 

923 "tensor_split", 

924 "threshold", 

925 "threshold_backward", 

926 "tile", 

927 "to_copy", 

928 "topk", 

929 "trace", 

930 "tril", 

931 "tril_", 

932 "tril_out", 

933 "triu", 

934 "triu_", 

935 "true_divide", 

936 "true_divide_", 

937 "true_divide_out", 

938 "unfold_backward", 

939 "uniform_", 

940 "unique_consecutive", 

941 "unique_dim", 

942 "upsample_bicubic2d", 

943 "upsample_linear1d", 

944 "upsample_linear1d_backward", 

945 "upsample_nearest1d", 

946 "upsample_nearest2d", 

947 "upsample_nearest3d", 

948 "upsample_trilinear3d", 

949 "var", 

950 "var_correction", 

951 "var_dim", 

952 "var_mean", 

953 "vdot", 

954 "vector_norm", 

955 "view_copy", 

956 "vstack", 

957 "w8a8_block_fp8_matmul", 

958 "weight_norm_interface", 

959 "weight_norm_interface_backward", 

960 "where_scalar_other", 

961 "where_scalar_self", 

962 "where_self", 

963 "where_self_out", 

964 "zero", 

965 "zero_", 

966 "zero_out", 

967 "zeros", 

968 "zeros_like", 

969]