[CUDA] Affine quantize (#2354)

* affine quantize and dequantize kernels
* format
* fix
* format
2025-12-16 01:49:05 +08:00 · 2025-07-14 15:45:44 -07:00
parent e569803d7c
commit e7d2ebadd2
4 changed files with 384 additions and 2 deletions
--- a/mlx/backend/cuda/CMakeLists.txt
+++ b/mlx/backend/cuda/CMakeLists.txt
@@ -42,6 +42,7 @@ target_sources(
          ${CMAKE_CURRENT_SOURCE_DIR}/ternary.cu
          ${CMAKE_CURRENT_SOURCE_DIR}/unary.cu
          ${CMAKE_CURRENT_SOURCE_DIR}/utils.cpp
+          ${CMAKE_CURRENT_SOURCE_DIR}/quantized.cu
          ${CMAKE_CURRENT_SOURCE_DIR}/worker.cpp)

 target_compile_definitions(mlx PRIVATE MLX_USE_CUDA)