[CUDA] Affine quantize (#2354)

* affine quantize and dequantize kernels

* format

* fix

* format
This commit is contained in:
Awni Hannun
2025-07-14 15:45:44 -07:00
committed by GitHub
parent e569803d7c
commit e7d2ebadd2
4 changed files with 384 additions and 2 deletions

View File

@@ -42,6 +42,7 @@ target_sources(
${CMAKE_CURRENT_SOURCE_DIR}/ternary.cu
${CMAKE_CURRENT_SOURCE_DIR}/unary.cu
${CMAKE_CURRENT_SOURCE_DIR}/utils.cpp
${CMAKE_CURRENT_SOURCE_DIR}/quantized.cu
${CMAKE_CURRENT_SOURCE_DIR}/worker.cpp)
# Define the MLX_USE_CUDA preprocessor symbol when compiling the mlx target's
# own sources. PRIVATE keeps it out of the target's interface, so targets that
# link against mlx do not inherit the definition.
target_compile_definitions(mlx PRIVATE MLX_USE_CUDA)