Awni Hannun 
							
						 
					 
					
						
						
							
						
						4fda5fbdf9 
					 
					
						
						
							
							add python testing for cuda with ability to skip list of tests ( #2295 )  
						
						 
						
						
						
						
					 
					
						2025-06-15 10:56:48 -07:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Angelos Katharopoulos 
							
						 
					 
					
						
						
							
						
						8590c0941e 
					 
					
						
						
							
							Add load_safe to the general conv loaders ( #2258 )  
						
						 
						
						
						
						
					 
					
						2025-06-10 20:58:16 -07:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Awni Hannun 
							
						 
					 
					
						
						
							
						
						8576e6fe36 
					 
					
						
						
							
							fix conv2d bug + faster conv 1d ( #2195 )  
						
						 
						
						... 
						
						
						
						* fix conv2d bug + faster conv 1d
* revert sort + flaky test 
						
						
					 
					
						2025-05-18 06:05:11 -07:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Awni Hannun 
							
						 
					 
					
						
						
							
						
						602f43e3d1 
					 
					
						
						
							
							fix conv grad ( #2187 )  
						
						 
						
						
						
						
					 
					
						2025-05-15 19:20:36 -07:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								ATurker 
							
						 
					 
					
						
						
							
						
						a7fae8a176 
					 
					
						
						
							
							fix: conv_general differences between gpu, cpu ( #2070 )  
						
						 
						
						... 
						
						
						
						* fix general_conv padding
* fix bugs
* add test
---------
Co-authored-by: Awni Hannun <awni@apple.com>
						
						
					 
					
						2025-05-09 10:26:52 -07:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Jagrit Digani 
							
						 
					 
					
						
						
							
						
						8777fd104f 
					 
					
						
						
							
							Depthwise Conv2D optimization ( #2036 )  
						
						 
						
						... 
						
						
						
						- Add new specialized kernel for small kernel (kernels size <= 7), small strides (strides <= 2) depthwise 2d convolutions
- Add related tests 
						
						
					 
					
						2025-04-03 09:42:04 -07:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Angelos Katharopoulos 
							
						 
					 
					
						
						
							
						
						71de73a668 
					 
					
						
						
							
							Fix convs by reverting  #1803  ( #1882 )  
						
						 
						
						
						
						
					 
					
						2025-02-18 14:36:34 -08:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Jagrit Digani 
							
						 
					 
					
						
						
							
						
						2dc307f2e6 
					 
					
						
						
							
							Winograd Update for Small batches  ( #1803 )  
						
						 
						
						... 
						
						
						
						* Build in padding to Winograd kernels
* Add new fused Winograd kernel
* Enable weight flipping in Winograd kernels 
						
						
					 
					
						2025-02-14 13:08:13 -08:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Awni Hannun 
							
						 
					 
					
						
						
							
						
						af1b725fda 
					 
					
						
						
							
							Fix a couple of slicing bugs ( #1827 )  
						
						 
						
						... 
						
						
						
						* fix a few bugs
* fix conv grad
* speedup test
* comment 
						
						
					 
					
						2025-02-05 19:50:08 -08:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Awni Hannun 
							
						 
					 
					
						
						
							
						
						1017ac4a9e 
					 
					
						
						
							
							add dilation for conv 3d layers + test for 3d conv w/ dilation ( #1802 )  
						
						 
						
						
						
						
					 
					
						2025-01-28 06:17:07 -08:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Awni Hannun 
							
						 
					 
					
						
						
							
						
						0070e1db40 
					 
					
						
						
							
							Fix deep recursion with siblings ( #1462 )  
						
						 
						
						... 
						
						
						
						* fix recursion with siblings
* fix
* add test
* increase tol 
						
						
					 
					
						2024-10-07 06:15:33 -07:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Awni Hannun 
							
						 
					 
					
						
						
							
						
						e4534dac17 
					 
					
						
						
							
							Conv grad with groups + bugfix ( #1449 )  
						
						 
						
						... 
						
						
						
						* fix bug in flipped conv with groups, start of grad for groups
* fix
* fix
* fix + test 
						
						
					 
					
						2024-10-06 07:08:53 -07:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Max-Heinrich Laves 
							
						 
					 
					
						
						
							
						
						efeb9c0f02 
					 
					
						
						
							
							Transposed Convolution ( #1245 )  
						
						 
						
						... 
						
						
						
						* initial implementation for conv_transpose
ran pre-commit
implemented conv_transpose
updated conv_general docstring
updated conv_general docstring
updated code comments
removed commented run_conv_checks
updated acknowledgments
added missing entry to ops.rst
added op to nn.layers
resolved merge conflicts
* removed ConvolutionTranspose primitive as suggested by reviewer
removed ConvolutionTranspose primitive as suggested by reviewer
* remove transpose flag, add another test
---------
Co-authored-by: Awni Hannun <awni@apple.com>
						
						
					 
					
						2024-09-06 19:52:38 -07:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Awni Hannun 
							
						 
					 
					
						
						
							
						
						58d0e199e1 
					 
					
						
						
							
							add bfloat conv for winograd ( #1306 )  
						
						 
						
						... 
						
						
						
						* add bfloat conv for winograd
* accumulate in fp32
* accumulate in fp32
* accumulate in bf16 
						
						
					 
					
						2024-08-05 15:51:13 -07:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Nikhil Mehta 
							
						 
					 
					
						
						
							
						
						0b7d71fd2f 
					 
					
						
						
							
							Add softmin, hardshrink, hardtanh ( #1180 )  
						
						 
						
						... 
						
						
						
						---------
Co-authored-by: Nikhil Mehta <nikmehta@tesla.com>
						
						
					 
					
						2024-06-04 15:48:18 -07:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Rifur13 
							
						 
					 
					
						
						
							
						
						9401507336 
					 
					
						
						
							
							Add groups to 2-D convolutions ( #1129 )  
						
						 
						
						... 
						
						
						
						* Added groups to 2-D convolutions. Only implemented for **some** specializations.
Also fixed 1D grouped convs with different kernel strides and added more tests.
* fix channels condition 
						
						
					 
					
						2024-05-22 20:01:44 -07:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Max-Heinrich Laves 
							
						 
					 
					
						
						
							
						
						ff4223904d 
					 
					
						
						
							
							Conv3d ( #993 )  
						
						 
						
						... 
						
						
						
						* added conv3d
added conv3d
implemented explicit_gemm_conv_ND_cpu and bounds checks for slow_conv_3D
* incorporated reviewer comments
* fixed test
* reduced tensor shapes in test for conv3d
* Reviewer suggestion
Co-authored-by: Awni Hannun <awni.hannun@gmail.com>
Reviewer suggestion
Co-authored-by: Awni Hannun <awni.hannun@gmail.com>
Reviewer suggestion
Co-authored-by: Awni Hannun <awni.hannun@gmail.com>
Reviewer suggestion 
						
						
					 
					
						2024-05-11 06:15:02 -07:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Rifur13 
							
						 
					 
					
						
						
							
						
						c4a471c99d 
					 
					
						
						
							
							Add groups to Conv1d ( #948 )  
						
						 
						
						... 
						
						
						
						* Add conv1d grouped convs on CPU
* Add GPU support
* Parallelize inside metal kernel
* cleanup
* Update mlx/ops.cpp
Co-authored-by: Awni Hannun <awni.hannun@gmail.com>
* New unfold kernel + remove unused code
* Remove copy and refactor
* Update vjp and reuse steel gemm
* Fixed groups on cpu
* Fix metal validation
---------
Co-authored-by: Awni Hannun <awni.hannun@gmail.com>
						
						
					 
					
						2024-04-27 06:24:57 -07:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Jagrit Digani 
							
						 
					 
					
						
						
							
						
						776c3d226d 
					 
					
						
						
							
							Convolution update  ( #651 )  
						
						 
						
						... 
						
						
						
						* Init steel conv and update Conv primitive
* Update slow CPU implementation to support flipping and input dilation winograd conv routing
Co-authored-by: Awni Hannun <awni@apple.com>
						
						
					 
					
						2024-02-28 20:11:16 -08:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Awni Hannun 
							
						 
					 
					
						
						
							
						
						09b9275027 
					 
					
						
						
							
							Make shape a tuple ( #591 )  
						
						 
						
						... 
						
						
						
						* shape tuple
* also remove simplify from docs
* rebase 
						
						
					 
					
						2024-01-30 13:11:01 -08:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Zach Schillaci 
							
						 
					 
					
						
						
							
						
						5b9be57ac3 
					 
					
						
						
							
							Add isort pre-commit and run ( #68 )  
						
						 
						
						
						
						
					 
					
						2023-12-08 11:31:47 -08:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Awni Hannun 
							
						 
					 
					
						
						
							
						
						46a39e5b1f 
					 
					
						
						
							
							copyright + ack  
						
						 
						
						
						
						
					 
					
						2023-11-30 11:12:53 -08:00  
					
					
						 
						
						
							
							
							 
							
							
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Jagrit Digani 
							
						 
					 
					
						
						
							
						
						e6306cfee9 
					 
					
						
						
							
							jagrit's commit files  
						
						 
						
						
						
						
					 
					
						2023-11-29 10:52:08 -08:00