[CUDA] Affine quantize (#2354)

* affine quantize and dequantize kernels
* format
* fix
* format
2025-12-11 23:14:50 +08:00 · 2025-07-14 15:45:44 -07:00
parent e569803d7c
commit e7d2ebadd2
4 changed files with 384 additions and 2 deletions
--- a/python/tests/cuda_skip.py
+++ b/python/tests/cuda_skip.py
@@ -83,7 +83,6 @@ cuda_skip = {
    "TestQuantized.test_qmm_shapes",
    "TestQuantized.test_qmm_vjp",
    "TestQuantized.test_qmv",
-    "TestQuantized.test_quantize_dequantize",
    "TestQuantized.test_qvm",
    "TestQuantized.test_qvm_splitk",
    "TestQuantized.test_small_matrix",