From 97afe40b7bdae90d0ceca80f3a97e5ec9a0903a7 Mon Sep 17 00:00:00 2001 From: Angelos Katharopoulos Date: Thu, 7 Aug 2025 00:55:08 -0700 Subject: [PATCH] Remove duplicate register tile --- mlx/backend/cuda/steel/tiles.cuh | 51 -------------------------------- 1 file changed, 51 deletions(-) diff --git a/mlx/backend/cuda/steel/tiles.cuh b/mlx/backend/cuda/steel/tiles.cuh index be6c46648..a2c51ef20 100644 --- a/mlx/backend/cuda/steel/tiles.cuh +++ b/mlx/backend/cuda/steel/tiles.cuh @@ -223,57 +223,6 @@ struct RegisterTile { } }; -/** - * A simple container of multiple Tile16x16. - * - * Provides utility functions for loading and manipulating collections of basic - * tiles. - */ -template -struct RegisterTile { - static constexpr int ROWS = ROWS_; - static constexpr int COLS = COLS_; - static constexpr int TILES_X = COLS / 16; - static constexpr int TILES_Y = ROWS / 16; - - Tile16x16 data[TILES_X * TILES_Y]; - - __device__ inline void fill(T v) { - MLX_UNROLL - for (int i = 0; i < TILES_Y; i++) { - MLX_UNROLL - for (int j = 0; j < TILES_X; j++) { - data[i * TILES_X + j].fill(v); - } - } - } - - template - __device__ inline void - load(Tile& tile, uint32_t base_address, int row, int col) { - MLX_UNROLL - for (int i = 0; i < TILES_Y; i++) { - MLX_UNROLL - for (int j = 0; j < TILES_X; j++) { - data[i * TILES_X + j].load( - tile.loc(base_address, row + i * 16, col + j * 16)); - } - } - } - - template - __device__ inline void store_global(U* x, int N, int row, int col) { - MLX_UNROLL - for (int i = 0; i < TILES_Y; i++) { - MLX_UNROLL - for (int j = 0; j < TILES_X; j++) { - data[i * TILES_X + j].store_global( - x + (row + i * 16) * N + col + j * 16, N); - } - } - } -}; - template struct SharedTile { static constexpr int ROWS = ROWS_;