Coverage for src/flag_gems/runtime/backend/_kunlunxin/ops/__init__.py: 0%

170 statements  

« prev     ^ index     » next       coverage.py v7.6.9, created at 2026-03-16 02:02 +0800

1from .abs import abs, abs_ 

2from .acos import acos 

3from .add import add, add_ 

4from .addcdiv import addcdiv 

5from .addcmul import addcmul 

6from .addmm import addmm, addmm_out 

7from .addmv import addmv, addmv_out 

8from .addr import addr 

9from .all import all, all_dim, all_dims 

10from .amax import amax 

11from .angle import angle 

12from .any import any, any_dim, any_dims 

13from .arange import arange, arange_start 

14from .argmax import argmax 

15from .argmin import argmin 

16from .atan import atan, atan_ 

17from .attention import ( 

18 ScaleDotProductAttention, 

19 flash_attention_forward, 

20 flash_attn_varlen_func, 

21 scaled_dot_product_attention, 

22 scaled_dot_product_attention_backward, 

23 scaled_dot_product_attention_forward, 

24) 

25from .avg_pool2d import avg_pool2d, avg_pool2d_backward 

26from .baddbmm import baddbmm 

27from .batch_norm import batch_norm, batch_norm_backward 

28from .bitwise_and import ( 

29 bitwise_and_scalar, 

30 bitwise_and_scalar_, 

31 bitwise_and_scalar_tensor, 

32 bitwise_and_tensor, 

33 bitwise_and_tensor_, 

34) 

35from .bitwise_left_shift import bitwise_left_shift 

36from .bitwise_not import bitwise_not, bitwise_not_ 

37from .bitwise_or import ( 

38 bitwise_or_scalar, 

39 bitwise_or_scalar_, 

40 bitwise_or_scalar_tensor, 

41 bitwise_or_tensor, 

42 bitwise_or_tensor_, 

43) 

44from .bitwise_right_shift import bitwise_right_shift 

45from .bmm import bmm, bmm_out 

46from .cat import cat 

47from .celu import celu, celu_ 

48from .clamp import clamp, clamp_, clamp_min, clamp_min_, clamp_tensor, clamp_tensor_ 

49from .contiguous import contiguous 

50from .conv1d import conv1d 

51from .conv2d import conv2d 

52from .conv3d import conv3d 

53from .conv_depthwise2d import _conv_depthwise2d 

54from .copy import copy, copy_ 

55from .cos import cos, cos_ 

56from .count_nonzero import count_nonzero 

57from .cummax import cummax 

58from .cummin import cummin 

59from .cumsum import cumsum, cumsum_out, normed_cumsum 

60from .diag import diag 

61from .diag_embed import diag_embed 

62from .diagonal import diagonal_backward 

63from .div import ( 

64 div_mode, 

65 div_mode_, 

66 floor_divide, 

67 floor_divide_, 

68 remainder, 

69 remainder_, 

70 true_divide, 

71 true_divide_, 

72 true_divide_out, 

73) 

74from .dot import dot 

75from .dropout import dropout, dropout_backward 

76from .elu import elu, elu_, elu_backward 

77from .embedding import embedding, embedding_backward 

78from .eq import eq, eq_scalar 

79from .erf import erf, erf_ 

80from .exp import exp, exp_, exp_out 

81from .exp2 import exp2, exp2_ 

82from .exponential_ import exponential_ 

83from .eye import eye 

84from .eye_m import eye_m 

85from .fill import fill_scalar, fill_scalar_, fill_tensor, fill_tensor_ 

86from .flip import flip 

87from .full import full 

88from .full_like import full_like 

89from .gather import gather, gather_backward 

90from .ge import ge, ge_scalar 

91from .gelu import gelu, gelu_, gelu_backward 

92from .get_scheduler_metadata import get_scheduler_metadata 

93from .glu import glu, glu_backward 

94from .groupnorm import group_norm, group_norm_backward 

95from .gt import gt, gt_scalar 

96from .hstack import hstack 

97from .index import index 

98from .index_add import index_add, index_add_ 

99from .index_put import index_put, index_put_ 

100from .index_select import index_select 

101from .isclose import allclose, isclose 

102from .isfinite import isfinite 

103from .isin import isin 

104from .isinf import isinf 

105from .isnan import isnan 

106from .kron import kron 

107from .layernorm import layer_norm, layer_norm_backward 

108from .le import le, le_scalar 

109from .lerp import lerp_scalar, lerp_scalar_, lerp_tensor, lerp_tensor_ 

110from .linspace import linspace 

111from .log import log 

112from .log_sigmoid import log_sigmoid 

113from .log_softmax import log_softmax, log_softmax_backward 

114from .logical_and import logical_and 

115from .logical_not import logical_not 

116from .logical_or import logical_or 

117from .logical_xor import logical_xor 

118from .logspace import logspace 

119from .lt import lt, lt_scalar 

120from .masked_fill import masked_fill, masked_fill_ 

121from .masked_scatter import masked_scatter, masked_scatter_ 

122from .masked_select import masked_select 

123from .max import max, max_dim 

124from .max_pool2d_with_indices import max_pool2d_backward, max_pool2d_with_indices 

125from .maximum import maximum 

126from .mean import mean, mean_dim 

127from .min import min, min_dim 

128from .minimum import minimum 

129from .mm import mm, mm_out 

130from .mse_loss import mse_loss 

131from .mul import mul, mul_ 

132from .multinomial import multinomial 

133from .mv import mv, mv_cluster 

134from .nan_to_num import nan_to_num 

135from .ne import ne, ne_scalar 

136from .neg import neg, neg_ 

137from .nllloss import ( 

138 nll_loss2d_backward, 

139 nll_loss2d_forward, 

140 nll_loss_backward, 

141 nll_loss_forward, 

142) 

143from .nonzero import nonzero 

144from .normal import normal_float_tensor, normal_tensor_float, normal_tensor_tensor 

145from .ones import ones 

146from .ones_like import ones_like 

147from .pad import constant_pad_nd, pad 

148from .per_token_group_quant_fp8 import SUPPORTED_FP8_DTYPE, per_token_group_quant_fp8 

149from .polar import polar 

150from .pow import ( 

151 pow_scalar, 

152 pow_tensor_scalar, 

153 pow_tensor_scalar_, 

154 pow_tensor_tensor, 

155 pow_tensor_tensor_, 

156) 

157from .prod import prod, prod_dim 

158from .quantile import quantile 

159from .rand import rand 

160from .rand_like import rand_like 

161from .randn import randn 

162from .randn_like import randn_like 

163from .randperm import randperm 

164from .reciprocal import reciprocal, reciprocal_ 

165from .relu import relu, relu_ 

166from .repeat import repeat 

167from .repeat_interleave import ( 

168 repeat_interleave_self_int, 

169 repeat_interleave_self_tensor, 

170 repeat_interleave_tensor, 

171) 

172from .resolve_conj import resolve_conj 

173from .resolve_neg import resolve_neg 

174from .rms_norm import rms_norm, rms_norm_backward, rms_norm_forward 

175from .rsqrt import rsqrt, rsqrt_ 

176from .rsub import rsub 

177from .scaled_softmax import scaled_softmax_backward, scaled_softmax_forward 

178from .scatter import scatter, scatter_ 

179from .scatter_add_ import scatter_add_ 

180from .select_scatter import select_scatter 

181from .sigmoid import sigmoid, sigmoid_, sigmoid_backward 

182from .silu import silu, silu_, silu_backward 

183from .sin import sin, sin_ 

184from .slice_scatter import slice_scatter 

185from .softmax import softmax, softmax_backward 

186from .softplus import softplus 

187from .sort import sort, sort_stable 

188from .sqrt import sqrt, sqrt_ 

189from .stack import stack 

190from .std import std 

191from .sub import sub, sub_ 

192from .sum import sum, sum_dim, sum_dim_out, sum_out 

193from .tan import tan, tan_ 

194from .tanh import tanh, tanh_, tanh_backward 

195from .threshold import threshold, threshold_backward 

196from .tile import tile 

197from .to import to_copy 

198from .topk import topk 

199from .trace import trace 

200from .triu import triu 

201from .uniform import uniform_ 

202from .unique import _unique2 

203from .upsample_bicubic2d_aa import _upsample_bicubic2d_aa 

204from .upsample_nearest1d import upsample_nearest1d 

205from .upsample_nearest2d import upsample_nearest2d 

206from .var_mean import var_mean 

207from .vdot import vdot 

208from .vector_norm import vector_norm 

209from .vstack import vstack 

210from .weightnorm import weight_norm_interface, weight_norm_interface_backward 

211from .where import where_scalar_other, where_scalar_self, where_self, where_self_out 

212from .zeros import zeros 

213from .zeros_like import zeros_like 

214 

215__all__ = [ 

216 "_conv_depthwise2d", 

217 "_unique2", 

218 "_upsample_bicubic2d_aa", 

219 "abs", 

220 "abs_", 

221 "acos", 

222 "add", 

223 "add_", 

224 "addcdiv", 

225 "addcmul", 

226 "addmm", 

227 "addmm_out", 

228 "addmv", 

229 "addmv_out", 

230 "addr", 

231 "all", 

232 "all_dim", 

233 "all_dims", 

234 "allclose", 

235 "amax", 

236 "angle", 

237 "any", 

238 "any_dim", 

239 "any_dims", 

240 "arange", 

241 "arange_start", 

242 "argmax", 

243 "argmin", 

244 "avg_pool2d", 

245 "avg_pool2d_backward", 

246 "atan", 

247 "atan_", 

248 "baddbmm", 

249 "batch_norm", 

250 "batch_norm_backward", 

251 "bitwise_and_scalar", 

252 "bitwise_and_scalar_", 

253 "bitwise_and_scalar_tensor", 

254 "bitwise_and_tensor", 

255 "bitwise_and_tensor_", 

256 "bitwise_left_shift", 

257 "bitwise_right_shift", 

258 "bitwise_not", 

259 "bitwise_not_", 

260 "bitwise_or_scalar", 

261 "bitwise_or_scalar_", 

262 "bitwise_or_scalar_tensor", 

263 "bitwise_or_tensor", 

264 "bitwise_or_tensor_", 

265 "bmm", 

266 "bmm_out", 

267 "cat", 

268 "celu", 

269 "celu_", 

270 "clamp", 

271 "clamp_", 

272 "clamp_tensor", 

273 "clamp_tensor_", 

274 "clamp_min", 

275 "clamp_min_", 

276 "constant_pad_nd", 

277 "contiguous", 

278 "conv1d", 

279 "conv2d", 

280 "conv3d", 

281 "copy", 

282 "copy_", 

283 "cos", 

284 "cos_", 

285 "count_nonzero", 

286 "cummax", 

287 "cummin", 

288 "cumsum", 

289 "cumsum_out", 

290 "diag", 

291 "diag_embed", 

292 "diagonal_backward", 

293 "div_mode", 

294 "div_mode_", 

295 "dot", 

296 "dropout", 

297 "dropout_backward", 

298 "elu", 

299 "elu_", 

300 "elu_backward", 

301 "embedding", 

302 "embedding_backward", 

303 "eq", 

304 "eq_scalar", 

305 "erf", 

306 "erf_", 

307 "exp", 

308 "exp_", 

309 "exp_out", 

310 "exp2", 

311 "exp2_", 

312 "exponential_", 

313 "eye", 

314 "eye_m", 

315 "fill_scalar", 

316 "fill_scalar_", 

317 "fill_tensor", 

318 "fill_tensor_", 

319 "flash_attention_forward", 

320 "flash_attn_varlen_func", 

321 "flip", 

322 "floor_divide", 

323 "floor_divide_", 

324 "full", 

325 "full_like", 

326 "gather", 

327 "gather_backward", 

328 "ge", 

329 "ge_scalar", 

330 "gelu", 

331 "gelu_", 

332 "gelu_backward", 

333 "get_scheduler_metadata", 

334 "glu", 

335 "glu_backward", 

336 "group_norm", 

337 "group_norm_backward", 

338 "gt", 

339 "gt_scalar", 

340 "hstack", 

341 "index", 

342 "index_add", 

343 "index_add_", 

344 "index_put", 

345 "index_put_", 

346 "index_select", 

347 "isclose", 

348 "isfinite", 

349 "isin", 

350 "isinf", 

351 "isnan", 

352 "kron", 

353 "layer_norm", 

354 "layer_norm_backward", 

355 "le", 

356 "le_scalar", 

357 "lerp_scalar", 

358 "lerp_scalar_", 

359 "lerp_tensor", 

360 "lerp_tensor_", 

361 "linspace", 

362 "log", 

363 "log_sigmoid", 

364 "log_softmax", 

365 "log_softmax_backward", 

366 "logical_and", 

367 "logical_not", 

368 "logical_or", 

369 "logical_xor", 

370 "logspace", 

371 "lt", 

372 "lt_scalar", 

373 "masked_fill", 

374 "masked_fill_", 

375 "masked_scatter", 

376 "masked_scatter_", 

377 "masked_select", 

378 "max", 

379 "max_dim", 

380 "maximum", 

381 "max_pool2d_with_indices", 

382 "max_pool2d_backward", 

383 "mean", 

384 "mean_dim", 

385 "min", 

386 "min_dim", 

387 "minimum", 

388 "mm", 

389 "mm_out", 

390 "mse_loss", 

391 "mul", 

392 "mul_", 

393 "multinomial", 

394 "mv", 

395 "mv_cluster", 

396 "nan_to_num", 

397 "ne", 

398 "ne_scalar", 

399 "neg", 

400 "neg_", 

401 "nll_loss_backward", 

402 "nll_loss_forward", 

403 "nll_loss2d_backward", 

404 "nll_loss2d_forward", 

405 "nonzero", 

406 "normal_float_tensor", 

407 "normal_tensor_float", 

408 "normal_tensor_tensor", 

409 "normed_cumsum", 

410 "ones", 

411 "ones_like", 

412 "pad", 

413 "per_token_group_quant_fp8", 

414 "polar", 

415 "pow_scalar", 

416 "pow_tensor_scalar", 

417 "pow_tensor_scalar_", 

418 "pow_tensor_tensor", 

419 "pow_tensor_tensor_", 

420 "prod", 

421 "prod_dim", 

422 "quantile", 

423 "rand", 

424 "rand_like", 

425 "randn", 

426 "randn_like", 

427 "randperm", 

428 "reciprocal", 

429 "reciprocal_", 

430 "relu", 

431 "relu_", 

432 "remainder", 

433 "remainder_", 

434 "repeat", 

435 "repeat_interleave_self_int", 

436 "repeat_interleave_self_tensor", 

437 "repeat_interleave_tensor", 

438 "resolve_conj", 

439 "resolve_neg", 

440 "rms_norm", 

441 "rms_norm_forward", 

442 "rms_norm_backward", 

443 "sqrt", 

444 "sqrt_", 

445 "rsqrt", 

446 "rsqrt_", 

447 "rsub", 

448 "scaled_dot_product_attention", 

449 "scaled_dot_product_attention_backward", 

450 "scaled_dot_product_attention_forward", 

451 "scaled_softmax_backward", 

452 "scaled_softmax_forward", 

453 "scatter", 

454 "scatter_", 

455 "scatter_add_", 

456 "select_scatter", 

457 "sigmoid", 

458 "sigmoid_", 

459 "sigmoid_backward", 

460 "silu", 

461 "silu_", 

462 "silu_backward", 

463 "sin", 

464 "sin_", 

465 "slice_scatter", 

466 "softmax", 

467 "softmax_backward", 

468 "softplus", 

469 "sort", 

470 "sort_stable", 

471 "stack", 

472 "std", 

473 "sub", 

474 "sub_", 

475 "sum", 

476 "sum_dim", 

477 "sum_dim_out", 

478 "sum_out", 

479 "ScaleDotProductAttention", 

480 "SUPPORTED_FP8_DTYPE", 

481 "tan", 

482 "tan_", 

483 "tanh", 

484 "tanh_", 

485 "tanh_backward", 

486 "threshold", 

487 "threshold_backward", 

488 "tile", 

489 "to_copy", 

490 "topk", 

491 "trace", 

492 "triu", 

493 "true_divide", 

494 "true_divide_out", 

495 "true_divide_", 

496 "uniform_", 

497 "upsample_nearest1d", 

498 "upsample_nearest2d", 

499 "var_mean", 

500 "vdot", 

501 "vector_norm", 

502 "vstack", 

503 "weight_norm_interface", 

504 "weight_norm_interface_backward", 

505 "where_scalar_other", 

506 "where_scalar_self", 

507 "where_self", 

508 "where_self_out", 

509 "zeros", 

510 "zeros_like", 

511]