mirror of
				https://github.com/ml-explore/mlx.git
				synced 2025-10-31 16:21:27 +08:00 
			
		
		
		
	Improvements in the quantizer and dequantization kernel (#1061)
This commit is contained in:
		 Angelos Katharopoulos
					Angelos Katharopoulos
				
			
				
					committed by
					
						 GitHub
						GitHub
					
				
			
			
				
	
			
			
			 GitHub
						GitHub
					
				
			
						parent
						
							7f7b9662ea
						
					
				
				
					commit
					17f57df797
				
@@ -16,7 +16,7 @@ class TestQuantized(mlx_tests.MLXTestCase):
                 w_hat = mx.dequantize(w_q, scales, biases, gs, b)
                 errors = (w - w_hat).abs().reshape(*scales.shape, -1)
                 eps = 1e-6
-                self.assertTrue((2 * errors <= (scales[..., None] + eps)).all())
+                self.assertTrue((errors <= (scales[..., None] + eps).abs()).all())
 
         # test quantize/dequantize 0s
         a = mx.zeros((256, 512))
		Reference in New Issue
	
	Block a user