Skip to content
1 change: 0 additions & 1 deletion backends/cuda/tests/test_int4_matmul.py
Original file line number Diff line number Diff line change
Expand Up @@ -19,7 +19,6 @@
import unittest

import torch
import torch.nn as nn

from executorch.backends.cuda.triton.kernels.int4_matmul import (
dequant_w4_to_bf16,
Expand Down
3 changes: 3 additions & 0 deletions backends/cuda/triton/kernels/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,7 @@
fused_moe,
fused_moe_batched,
fused_moe_batched_gemm,
fused_moe_batched_gemm_int8,
moe_align_block_size,
)

Expand All @@ -23,6 +24,8 @@
"fused_moe",
"fused_moe_batched",
"fused_moe_batched_gemm",
"fused_moe_batched_gemm_int8",
"int4_matvec",
"moe_align_block_size",
"sdpa",
"sdpa_decode_splitk",
Expand Down
Loading
Loading