[CUDA] Affine quantize (#2354)

* affine quantize and dequantize kernels

* format

* fix

* format
This commit is contained in:
Awni Hannun
2025-07-14 15:45:44 -07:00
committed by GitHub
parent e569803d7c
commit e7d2ebadd2
4 changed files with 384 additions and 2 deletions

View File

@@ -83,7 +83,6 @@ cuda_skip = {
"TestQuantized.test_qmm_shapes",
"TestQuantized.test_qmm_vjp",
"TestQuantized.test_qmv",
-"TestQuantized.test_quantize_dequantize",
"TestQuantized.test_qvm",
"TestQuantized.test_qvm_splitk",
"TestQuantized.test_small_matrix",