Skip to content

Commit 4b1b88d

Browse files
committed
jit kernel support per-tensor quant
1 parent 8718303 commit 4b1b88d

1 file changed

Lines changed: 0 additions & 4 deletions

File tree

python/sglang/jit_kernel/csrc/gemm/per_tensor_quant_fp8.cuh

Lines changed: 0 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -133,8 +133,6 @@ void per_tensor_quant_fp8(tvm::ffi::TensorView input,
133 133
const size_t num_blocks = std::min((total_elements + kBlockSize - 1) / kBlockSize, size_t(1024));
134 134
const DLDevice device = device_.unwrap();
135 135

136-
RuntimeCheck(total_elements > 0, "Input tensor must be non-empty");
137-
138 136
auto launch_kernels = [&]<typename T>() {
139 137
if constexpr (!kIsStatic) {
140 138
LaunchKernel(num_blocks, kBlockSize, device)(
@@ -159,8 +157,6 @@ void per_tensor_quant_fp8(tvm::ffi::TensorView input,
159 157
launch_kernels.template operator()<c10::BFloat16>();
160 158
} else if (dtype.code == kDLFloat && dtype.bits == 16) {
161 159
launch_kernels.template operator()<c10::Half>();
162-
} else {
163-
RuntimeCheck(false, "Unsupported input dtype");
164 160
}
165 161
}
166 162

0 commit comments

Comments
 (0)