[CUDA] Quantized refactoring (#2442)

This commit is contained in:
Angelos Katharopoulos
2025-07-30 08:27:20 -07:00
committed by GitHub
parent 2204182bba
commit 3bf81ed1bd
5 changed files with 246 additions and 140 deletions

View File

@@ -46,7 +46,8 @@ target_sources(
${CMAKE_CURRENT_SOURCE_DIR}/ternary.cu
${CMAKE_CURRENT_SOURCE_DIR}/unary.cu
${CMAKE_CURRENT_SOURCE_DIR}/utils.cpp
${CMAKE_CURRENT_SOURCE_DIR}/quantized.cu
${CMAKE_CURRENT_SOURCE_DIR}/quantized/affine_quantize.cu
${CMAKE_CURRENT_SOURCE_DIR}/quantized/quantized.cpp
${CMAKE_CURRENT_SOURCE_DIR}/worker.cpp)
if(CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL 12.9.0)