[CUDA] RMSNorm and VJP (#2280)

* rms norm start

* nit
This commit is contained in:
Awni Hannun
2025-06-12 17:09:49 -07:00
committed by GitHub
parent a4fc671d3e
commit 918761a25a
4 changed files with 345 additions and 4 deletions

View File

@@ -30,6 +30,7 @@ target_sources(
${CMAKE_CURRENT_SOURCE_DIR}/reduce/col_reduce.cu
${CMAKE_CURRENT_SOURCE_DIR}/reduce/row_reduce.cu
${CMAKE_CURRENT_SOURCE_DIR}/reduce/segmented_reduce.cu
${CMAKE_CURRENT_SOURCE_DIR}/rms_norm.cu
${CMAKE_CURRENT_SOURCE_DIR}/slicing.cpp
${CMAKE_CURRENT_SOURCE_DIR}/softmax.cu
${CMAKE_CURRENT_SOURCE_DIR}/sort.cu