mirror of
https://github.com/ml-explore/mlx.git
synced 2025-06-24 01:17:26 +08:00
Commit Graph
Select branches
Hide Pull Requests
ab-nf4-quant
alternative_fence
async_all_reduce
attn-update
checkpoint_module
compile-test
cpp20
cuda-reduce
cuda-sdpa-vector
cuda_available
dynamic_reshape
fences_must_exit
fft
gemm-tuner
gguf_q4_k
gh-pages
gs16
interrupt_eval
io-dev
main
mat-attn
more_donation
packed-quants
priority-queue-eval
q-sdpa
quantized-kv-update
raw-sockets-distributed
sdpa-test
socket-distributed-layers
socket-distributed-layers-gloo
sockets-distributed
split_logsumexp
steel-refactor
stop-fence-term
trellis-quants
winograd_qupdate
#1
#1000
#1002
#1003
#1006
#1007
#1010
#1011
#1014
#1016
#1018
#1019
#102
#1020
#1028
#1030
#1032
#1034
#1035
#1036
#1037
#1038
#1039
#104
#1043
#1053
#1054
#1058
#1059
#1060
#1061
#1064
#1067
#1070
#1074
#1077
#1079
#108
#1081
#1085
#1087
#109
#1091
#1092
#1093
#1097
#1098
#1099
#11
#110
#1100
#1101
#1102
#1104
#1105
#1109
#111
#1110
#1111
#1112
#1113
#1114
#1115
#1116
#1117
#1118
#1119
#1120
#1122
#1123
#1124
#1125
#1126
#1129
#1131
#1132
#1135
#1136
#1137
#1138
#1139
#1140
#1141
#1142
#1147
#1149
#115
#1150
#1151
#1152
#1154
#1157
#116
#1161
#1165
#1167
#1168
#1169
#117
#1172
#1174
#1175
#1176
#1177
#1178
#1179
#118
#1180
#1183
#1184
#1185
#1188
#1189
#119
#1190
#1191
#1194
#1195
#1199
#120
#1200
#1202
#1203
#1204
#1205
#1206
#1208
#1209
#121
#1211
#1212
#1215
#1216
#122
#1221
#1222
#1224
#1227
#1228
#123
#1235
#1236
#1237
#1239
#1242
#1243
#1245
#1246
#1247
#1249
#125
#1252
#1253
#1256
#1260
#1262
#1262
#1263
#1264
#1266
#1268
#1269
#1270
#1273
#1274
#1275
#1278
#1279
#128
#1280
#1281
#1282
#1283
#1285
#1287
#1289
#1291
#1297
#1298
#1299
#1300
#1301
#1304
#1305
#1306
#1307
#1309
#131
#1310
#1314
#1315
#1316
#1318
#1319
#1320
#1323
#1325
#1326
#1327
#1329
#133
#1330
#1332
#1333
#1334
#1336
#1337
#1339
#1340
#1343
#1344
#1346
#1347
#1348
#1349
#1350
#1351
#1352
#1353
#1355
#1356
#1358
#1359
#136
#1360
#1361
#1362
#1365
#1366
#1367
#1368
#1369
#137
#1371
#1372
#1373
#1374
#1376
#1379
#138
#1381
#1383
#1384
#1385
#1387
#1389
#139
#1390
#1391
#1394
#1395
#1396
#1397
#1401
#1402
#1403
#1404
#1405
#1407
#1408
#1410
#1412
#1414
#1415
#1416
#1417
#1418
#1419
#142
#1420
#1421
#1425
#143
#1430
#1431
#1434
#1436
#1437
#144
#1440
#1442
#1444
#1445
#1446
#1447
#1449
#145
#1450
#1451
#1452
#1453
#1455
#1456
#1460
#1461
#1462
#1468
#1470
#1471
#1476
#1477
#1478
#1479
#1482
#1485
#1486
#1488
#149
#1490
#1491
#1492
#1493
#1495
#1496
#1497
#1498
#150
#1501
#1502
#1503
#1506
#1508
#1509
#1510
#1514
#1515
#1515
#1518
#1519
#1521
#1522
#1523
#1524
#1525
#1526
#1528
#1529
#1532
#1534
#1535
#1537
#1539
#1541
#1543
#1545
#1546
#1548
#1550
#1551
#1553
#1555
#1556
#1557
#1558
#156
#1561
#1562
#1563
#1564
#1565
#1566
#1568
#1569
#157
#1570
#1572
#1574
#1575
#1577
#1578
#1579
#158
#1584
#1587
#1589
#159
#1590
#1591
#1594
#1595
#1596
#1597
#1600
#1601
#1603
#1606
#1607
#1609
#161
#1610
#1612
#1613
#1615
#1616
#1617
#1620
#1625
#1626
#1627
#1628
#1629
#1630
#1632
#1634
#1635
#1637
#1638
#1639
#1640
#1642
#1644
#1645
#1646
#1650
#1651
#1652
#1653
#1654
#1655
#1656
#1657
#1658
#1659
#166
#1660
#1661
#1662
#1663
#1664
#1665
#1666
#1667
#1668
#167
#1671
#1672
#1673
#1674
#1675
#1677
#1678
#1679
#1680
#1681
#1682
#1683
#1684
#1685
#1687
#1688
#1689
#1690
#1691
#1692
#1693
#1694
#1695
#1696
#1697
#1698
#1699
#170
#1700
#1701
#1702
#1704
#1705
#1706
#1708
#1709
#1710
#1714
#1715
#1716
#1718
#1719
#1721
#1722
#1723
#1724
#1726
#1727
#1728
#1731
#1732
#1733
#1735
#1736
#1737
#1738
#1740
#1741
#1742
#1743
#1745
#1746
#1747
#1748
#1749
#1750
#1752
#1753
#1754
#1755
#1756
#1757
#1758
#1759
#1760
#1761
#1762
#1763
#1764
#1765
#1768
#1772
#1773
#1774
#1775
#1776
#1777
#1782
#1783
#1784
#1788
#1789
#1789
#1793
#1795
#1797
#1798
#1799
#1801
#1802
#1803
#1805
#1806
#181
#1810
#1811
#1812
#1813
#1814
#1816
#1817
#1819
#1820
#1822
#1825
#1827
#1829
#183
#1830
#1831
#1833
#1834
#1835
#1836
#1837
#1838
#184
#1840
#1843
#1844
#1845
#1848
#185
#1852
#1854
#1856
#1857
#1858
#1859
#186
#1860
#1861
#1862
#1863
#1864
#1865
#1866
#1867
#1869
#187
#1870
#1874
#1875
#1876
#1879
#1882
#1883
#1884
#1885
#1887
#1889
#189
#1890
#1892
#1894
#1896
#1897
#1898
#1899
#190
#1900
#1901
#1902
#1904
#1906
#1911
#1913
#1914
#1915
#1916
#1917
#1920
#1921
#1921
#1922
#1923
#1924
#1925
#1926
#1928
#1929
#1931
#1932
#1935
#1936
#1937
#1938
#1939
#1940
#1943
#1944
#1948
#1949
#195
#1950
#1952
#1953
#1955
#1957
#196
#1961
#1962
#1966
#1968
#1969
#1970
#1970
#1972
#1973
#1974
#1975
#1976
#1978
#198
#1980
#1981
#1982
#1983
#1985
#1986
#1987
#1988
#1989
#199
#1990
#1991
#1992
#1995
#1996
#1997
#1998
#1999
#2
#2000
#2004
#2005
#2006
#2007
#2008
#2009
#2011
#2012
#2013
#2014
#2016
#2017
#2018
#202
#2020
#2021
#2024
#2025
#2026
#2027
#2028
#2029
#203
#2031
#2032
#2033
#2035
#2036
#2040
#2041
#2042
#2043
#2044
#2045
#2046
#2047
#2048
#2049
#205
#2051
#2052
#2053
#2054
#2055
#2058
#2059
#2060
#2061
#2062
#2065
#2066
#2068
#2069
#207
#2070
#2071
#2072
#2073
#2074
#2074
#2075
#2078
#2079
#2080
#2081
#2082
#2087
#209
#2090
#2091
#2092
#2094
#2095
#210
#2100
#2101
#2102
#2104
#2104
#2109
#211
#2110
#2114
#2117
#2119
#2121
#2123
#2128
#2129
#2131
#2135
#2136
#2138
#2139
#2141
#2142
#2143
#2145
#2147
#2148
#215
#2150
#2151
#2152
#2153
#2156
#2156
#2157
#2158
#2160
#2161
#2162
#217
#2172
#2173
#2176
#2177
#2178
#2179
#2181
#2182
#2183
#2187
#2188
#2189
#2191
#2192
#2193
#2195
#22
#2201
#2202
#2204
#2206
#2207
#2209
#221
#2210
#2213
#2214
#2215
#2215
#2216
#2217
#2219
#2219
#222
#2220
#2221
#2223
#2225
#2226
#2230
#2231
#2232
#2234
#2234
#2237
#2239
#224
#2240
#2241
#2242
#2243
#2244
#2246
#2247
#2248
#225
#2250
#2255
#2256
#2258
#2259
#226
#2260
#2261
#2262
#2263
#2264
#2265
#2268
#2269
#227
#2270
#2271
#2272
#2274
#2275
#2276
#2277
#228
#2280
#2282
#2283
#2284
#2286
#2287
#2288
#2289
#2290
#2290
#2291
#2293
#2294
#2294
#2295
#2296
#2297
#2297
#2298
#2299
#230
#2300
#2300
#2302
#2303
#2304
#2306
#2307
#2308
#232
#233
#235
#240
#244
#245
#247
#249
#250
#252
#254
#255
#256
#26
#260
#261
#263
#268
#274
#275
#276
#277
#278
#280
#281
#284
#289
#29
#292
#295
#298
#299
#3
#302
#304
#305
#306
#307
#308
#309
#310
#311
#312
#313
#315
#316
#317
#318
#319
#32
#323
#324
#325
#327
#329
#330
#332
#334
#335
#336
#337
#339
#34
#340
#342
#344
#345
#347
#348
#349
#350
#352
#353
#354
#355
#356
#357
#358
#359
#36
#364
#366
#370
#371
#373
#374
#375
#379
#38
#380
#381
#382
#383
#384
#385
#386
#388
#389
#390
#391
#392
#394
#395
#397
#398
#4
#401
#405
#406
#409
#411
#412
#414
#415
#418
#419
#421
#423
#424
#425
#426
#427
#428
#430
#431
#432
#433
#435
#438
#441
#443
#444
#445
#446
#447
#448
#449
#453
#455
#456
#457
#458
#461
#462
#463
#47
#470
#472
#473
#475
#476
#477
#478
#479
#480
#481
#482
#484
#489
#490
#492
#494
#497
#498
#5
#50
#500
#501
#505
#507
#508
#510
#511
#512
#513
#514
#517
#519
#520
#521
#523
#524
#525
#526
#527
#53
#533
#536
#537
#539
#541
#543
#55
#552
#554
#558
#559
#56
#560
#561
#562
#563
#564
#565
#569
#571
#579
#58
#581
#584
#588
#59
#591
#592
#595
#599
#6
#601
#602
#603
#604
#607
#608
#612
#613
#614
#616
#619
#62
#620
#622
#623
#624
#625
#626
#627
#629
#630
#631
#634
#635
#637
#638
#639
#64
#641
#643
#645
#647
#648
#651
#653
#656
#658
#659
#660
#661
#662
#663
#664
#667
#670
#674
#675
#676
#677
#678
#679
#68
#681
#682
#683
#684
#685
#686
#687
#688
#689
#69
#691
#692
#694
#696
#697
#698
#699
#7
#70
#702
#703
#704
#705
#706
#707
#708
#709
#710
#711
#713
#715
#716
#717
#718
#72
#721
#723
#727
#729
#730
#735
#737
#739
#74
#740
#744
#745
#747
#749
#75
#752
#759
#760
#761
#763
#764
#766
#768
#771
#776
#777
#778
#78
#78
#782
#783
#784
#785
#786
#787
#788
#79
#790
#791
#792
#793
#794
#796
#797
#8
#80
#800
#801
#802
#803
#804
#805
#806
#807
#809
#81
#812
#813
#816
#818
#819
#820
#821
#822
#823
#824
#826
#828
#829
#831
#835
#836
#838
#839
#84
#841
#843
#844
#848
#849
#85
#850
#852
#853
#858
#859
#861
#862
#863
#864
#867
#869
#87
#870
#871
#872
#874
#875
#876
#877
#879
#88
#880
#881
#883
#886
#889
#89
#890
#891
#892
#893
#894
#895
#897
#899
#9
#90
#901
#902
#903
#904
#905
#906
#907
#91
#911
#915
#916
#917
#919
#92
#920
#921
#923
#924
#925
#926
#929
#932
#933
#934
#94
#940
#941
#942
#944
#947
#948
#949
#950
#951
#952
#953
#955
#956
#957
#958
#960
#961
#962
#964
#967
#969
#970
#971
#972
#973
#974
#975
#976
#977
#978
#979
#98
#980
#981
#982
#984
#986
#987
#988
#989
#99
#991
#992
#993
#994
#998
v0.0.10
v0.0.11
v0.0.2
v0.0.3
v0.0.4
v0.0.5
v0.0.6
v0.0.7
v0.0.9
v0.1.0
v0.10.0
v0.11.0
v0.11.1
v0.12.0
v0.12.1
v0.12.2
v0.13.0
v0.13.1
v0.14.0
v0.14.1
v0.15.0
v0.15.1
v0.15.2
v0.16.0
v0.16.1
v0.16.2
v0.16.3
v0.17.0
v0.17.1
v0.17.2
v0.17.3
v0.18.0
v0.18.1
v0.19.0
v0.19.1
v0.19.2
v0.19.3
v0.2.0
v0.20.0
v0.21.0
v0.21.1
v0.22.0
v0.22.1
v0.23.0
v0.23.1
v0.23.2
v0.24.0
v0.24.1
v0.24.2
v0.25.0
v0.25.1
v0.25.2
v0.26.0
v0.26.1
v0.3.0
v0.4.0
v0.5.0
v0.5.1
v0.6.0
v0.7.0
v0.8.0
v0.8.1
v0.9.0
v0.9.1
Select branches
Hide Pull Requests
ab-nf4-quant
alternative_fence
async_all_reduce
attn-update
checkpoint_module
compile-test
cpp20
cuda-reduce
cuda-sdpa-vector
cuda_available
dynamic_reshape
fences_must_exit
fft
gemm-tuner
gguf_q4_k
gh-pages
gs16
interrupt_eval
io-dev
main
mat-attn
more_donation
packed-quants
priority-queue-eval
q-sdpa
quantized-kv-update
raw-sockets-distributed
sdpa-test
socket-distributed-layers
socket-distributed-layers-gloo
sockets-distributed
split_logsumexp
steel-refactor
stop-fence-term
trellis-quants
winograd_qupdate
#1
#1000
#1002
#1003
#1006
#1007
#1010
#1011
#1014
#1016
#1018
#1019
#102
#1020
#1028
#1030
#1032
#1034
#1035
#1036
#1037
#1038
#1039
#104
#1043
#1053
#1054
#1058
#1059
#1060
#1061
#1064
#1067
#1070
#1074
#1077
#1079
#108
#1081
#1085
#1087
#109
#1091
#1092
#1093
#1097
#1098
#1099
#11
#110
#1100
#1101
#1102
#1104
#1105
#1109
#111
#1110
#1111
#1112
#1113
#1114
#1115
#1116
#1117
#1118
#1119
#1120
#1122
#1123
#1124
#1125
#1126
#1129
#1131
#1132
#1135
#1136
#1137
#1138
#1139
#1140
#1141
#1142
#1147
#1149
#115
#1150
#1151
#1152
#1154
#1157
#116
#1161
#1165
#1167
#1168
#1169
#117
#1172
#1174
#1175
#1176
#1177
#1178
#1179
#118
#1180
#1183
#1184
#1185
#1188
#1189
#119
#1190
#1191
#1194
#1195
#1199
#120
#1200
#1202
#1203
#1204
#1205
#1206
#1208
#1209
#121
#1211
#1212
#1215
#1216
#122
#1221
#1222
#1224
#1227
#1228
#123
#1235
#1236
#1237
#1239
#1242
#1243
#1245
#1246
#1247
#1249
#125
#1252
#1253
#1256
#1260
#1262
#1262
#1263
#1264
#1266
#1268
#1269
#1270
#1273
#1274
#1275
#1278
#1279
#128
#1280
#1281
#1282
#1283
#1285
#1287
#1289
#1291
#1297
#1298
#1299
#1300
#1301
#1304
#1305
#1306
#1307
#1309
#131
#1310
#1314
#1315
#1316
#1318
#1319
#1320
#1323
#1325
#1326
#1327
#1329
#133
#1330
#1332
#1333
#1334
#1336
#1337
#1339
#1340
#1343
#1344
#1346
#1347
#1348
#1349
#1350
#1351
#1352
#1353
#1355
#1356
#1358
#1359
#136
#1360
#1361
#1362
#1365
#1366
#1367
#1368
#1369
#137
#1371
#1372
#1373
#1374
#1376
#1379
#138
#1381
#1383
#1384
#1385
#1387
#1389
#139
#1390
#1391
#1394
#1395
#1396
#1397
#1401
#1402
#1403
#1404
#1405
#1407
#1408
#1410
#1412
#1414
#1415
#1416
#1417
#1418
#1419
#142
#1420
#1421
#1425
#143
#1430
#1431
#1434
#1436
#1437
#144
#1440
#1442
#1444
#1445
#1446
#1447
#1449
#145
#1450
#1451
#1452
#1453
#1455
#1456
#1460
#1461
#1462
#1468
#1470
#1471
#1476
#1477
#1478
#1479
#1482
#1485
#1486
#1488
#149
#1490
#1491
#1492
#1493
#1495
#1496
#1497
#1498
#150
#1501
#1502
#1503
#1506
#1508
#1509
#1510
#1514
#1515
#1515
#1518
#1519
#1521
#1522
#1523
#1524
#1525
#1526
#1528
#1529
#1532
#1534
#1535
#1537
#1539
#1541
#1543
#1545
#1546
#1548
#1550
#1551
#1553
#1555
#1556
#1557
#1558
#156
#1561
#1562
#1563
#1564
#1565
#1566
#1568
#1569
#157
#1570
#1572
#1574
#1575
#1577
#1578
#1579
#158
#1584
#1587
#1589
#159
#1590
#1591
#1594
#1595
#1596
#1597
#1600
#1601
#1603
#1606
#1607
#1609
#161
#1610
#1612
#1613
#1615
#1616
#1617
#1620
#1625
#1626
#1627
#1628
#1629
#1630
#1632
#1634
#1635
#1637
#1638
#1639
#1640
#1642
#1644
#1645
#1646
#1650
#1651
#1652
#1653
#1654
#1655
#1656
#1657
#1658
#1659
#166
#1660
#1661
#1662
#1663
#1664
#1665
#1666
#1667
#1668
#167
#1671
#1672
#1673
#1674
#1675
#1677
#1678
#1679
#1680
#1681
#1682
#1683
#1684
#1685
#1687
#1688
#1689
#1690
#1691
#1692
#1693
#1694
#1695
#1696
#1697
#1698
#1699
#170
#1700
#1701
#1702
#1704
#1705
#1706
#1708
#1709
#1710
#1714
#1715
#1716
#1718
#1719
#1721
#1722
#1723
#1724
#1726
#1727
#1728
#1731
#1732
#1733
#1735
#1736
#1737
#1738
#1740
#1741
#1742
#1743
#1745
#1746
#1747
#1748
#1749
#1750
#1752
#1753
#1754
#1755
#1756
#1757
#1758
#1759
#1760
#1761
#1762
#1763
#1764
#1765
#1768
#1772
#1773
#1774
#1775
#1776
#1777
#1782
#1783
#1784
#1788
#1789
#1789
#1793
#1795
#1797
#1798
#1799
#1801
#1802
#1803
#1805
#1806
#181
#1810
#1811
#1812
#1813
#1814
#1816
#1817
#1819
#1820
#1822
#1825
#1827
#1829
#183
#1830
#1831
#1833
#1834
#1835
#1836
#1837
#1838
#184
#1840
#1843
#1844
#1845
#1848
#185
#1852
#1854
#1856
#1857
#1858
#1859
#186
#1860
#1861
#1862
#1863
#1864
#1865
#1866
#1867
#1869
#187
#1870
#1874
#1875
#1876
#1879
#1882
#1883
#1884
#1885
#1887
#1889
#189
#1890
#1892
#1894
#1896
#1897
#1898
#1899
#190
#1900
#1901
#1902
#1904
#1906
#1911
#1913
#1914
#1915
#1916
#1917
#1920
#1921
#1921
#1922
#1923
#1924
#1925
#1926
#1928
#1929
#1931
#1932
#1935
#1936
#1937
#1938
#1939
#1940
#1943
#1944
#1948
#1949
#195
#1950
#1952
#1953
#1955
#1957
#196
#1961
#1962
#1966
#1968
#1969
#1970
#1970
#1972
#1973
#1974
#1975
#1976
#1978
#198
#1980
#1981
#1982
#1983
#1985
#1986
#1987
#1988
#1989
#199
#1990
#1991
#1992
#1995
#1996
#1997
#1998
#1999
#2
#2000
#2004
#2005
#2006
#2007
#2008
#2009
#2011
#2012
#2013
#2014
#2016
#2017
#2018
#202
#2020
#2021
#2024
#2025
#2026
#2027
#2028
#2029
#203
#2031
#2032
#2033
#2035
#2036
#2040
#2041
#2042
#2043
#2044
#2045
#2046
#2047
#2048
#2049
#205
#2051
#2052
#2053
#2054
#2055
#2058
#2059
#2060
#2061
#2062
#2065
#2066
#2068
#2069
#207
#2070
#2071
#2072
#2073
#2074
#2074
#2075
#2078
#2079
#2080
#2081
#2082
#2087
#209
#2090
#2091
#2092
#2094
#2095
#210
#2100
#2101
#2102
#2104
#2104
#2109
#211
#2110
#2114
#2117
#2119
#2121
#2123
#2128
#2129
#2131
#2135
#2136
#2138
#2139
#2141
#2142
#2143
#2145
#2147
#2148
#215
#2150
#2151
#2152
#2153
#2156
#2156
#2157
#2158
#2160
#2161
#2162
#217
#2172
#2173
#2176
#2177
#2178
#2179
#2181
#2182
#2183
#2187
#2188
#2189
#2191
#2192
#2193
#2195
#22
#2201
#2202
#2204
#2206
#2207
#2209
#221
#2210
#2213
#2214
#2215
#2215
#2216
#2217
#2219
#2219
#222
#2220
#2221
#2223
#2225
#2226
#2230
#2231
#2232
#2234
#2234
#2237
#2239
#224
#2240
#2241
#2242
#2243
#2244
#2246
#2247
#2248
#225
#2250
#2255
#2256
#2258
#2259
#226
#2260
#2261
#2262
#2263
#2264
#2265
#2268
#2269
#227
#2270
#2271
#2272
#2274
#2275
#2276
#2277
#228
#2280
#2282
#2283
#2284
#2286
#2287
#2288
#2289
#2290
#2290
#2291
#2293
#2294
#2294
#2295
#2296
#2297
#2297
#2298
#2299
#230
#2300
#2300
#2302
#2303
#2304
#2306
#2307
#2308
#232
#233
#235
#240
#244
#245
#247
#249
#250
#252
#254
#255
#256
#26
#260
#261
#263
#268
#274
#275
#276
#277
#278
#280
#281
#284
#289
#29
#292
#295
#298
#299
#3
#302
#304
#305
#306
#307
#308
#309
#310
#311
#312
#313
#315
#316
#317
#318
#319
#32
#323
#324
#325
#327
#329
#330
#332
#334
#335
#336
#337
#339
#34
#340
#342
#344
#345
#347
#348
#349
#350
#352
#353
#354
#355
#356
#357
#358
#359
#36
#364
#366
#370
#371
#373
#374
#375
#379
#38
#380
#381
#382
#383
#384
#385
#386
#388
#389
#390
#391
#392
#394
#395
#397
#398
#4
#401
#405
#406
#409
#411
#412
#414
#415
#418
#419
#421
#423
#424
#425
#426
#427
#428
#430
#431
#432
#433
#435
#438
#441
#443
#444
#445
#446
#447
#448
#449
#453
#455
#456
#457
#458
#461
#462
#463
#47
#470
#472
#473
#475
#476
#477
#478
#479
#480
#481
#482
#484
#489
#490
#492
#494
#497
#498
#5
#50
#500
#501
#505
#507
#508
#510
#511
#512
#513
#514
#517
#519
#520
#521
#523
#524
#525
#526
#527
#53
#533
#536
#537
#539
#541
#543
#55
#552
#554
#558
#559
#56
#560
#561
#562
#563
#564
#565
#569
#571
#579
#58
#581
#584
#588
#59
#591
#592
#595
#599
#6
#601
#602
#603
#604
#607
#608
#612
#613
#614
#616
#619
#62
#620
#622
#623
#624
#625
#626
#627
#629
#630
#631
#634
#635
#637
#638
#639
#64
#641
#643
#645
#647
#648
#651
#653
#656
#658
#659
#660
#661
#662
#663
#664
#667
#670
#674
#675
#676
#677
#678
#679
#68
#681
#682
#683
#684
#685
#686
#687
#688
#689
#69
#691
#692
#694
#696
#697
#698
#699
#7
#70
#702
#703
#704
#705
#706
#707
#708
#709
#710
#711
#713
#715
#716
#717
#718
#72
#721
#723
#727
#729
#730
#735
#737
#739
#74
#740
#744
#745
#747
#749
#75
#752
#759
#760
#761
#763
#764
#766
#768
#771
#776
#777
#778
#78
#78
#782
#783
#784
#785
#786
#787
#788
#79
#790
#791
#792
#793
#794
#796
#797
#8
#80
#800
#801
#802
#803
#804
#805
#806
#807
#809
#81
#812
#813
#816
#818
#819
#820
#821
#822
#823
#824
#826
#828
#829
#831
#835
#836
#838
#839
#84
#841
#843
#844
#848
#849
#85
#850
#852
#853
#858
#859
#861
#862
#863
#864
#867
#869
#87
#870
#871
#872
#874
#875
#876
#877
#879
#88
#880
#881
#883
#886
#889
#89
#890
#891
#892
#893
#894
#895
#897
#899
#9
#90
#901
#902
#903
#904
#905
#906
#907
#91
#911
#915
#916
#917
#919
#92
#920
#921
#923
#924
#925
#926
#929
#932
#933
#934
#94
#940
#941
#942
#944
#947
#948
#949
#950
#951
#952
#953
#955
#956
#957
#958
#960
#961
#962
#964
#967
#969
#970
#971
#972
#973
#974
#975
#976
#977
#978
#979
#98
#980
#981
#982
#984
#986
#987
#988
#989
#99
#991
#992
#993
#994
#998
v0.0.10
v0.0.11
v0.0.2
v0.0.3
v0.0.4
v0.0.5
v0.0.6
v0.0.7
v0.0.9
v0.1.0
v0.10.0
v0.11.0
v0.11.1
v0.12.0
v0.12.1
v0.12.2
v0.13.0
v0.13.1
v0.14.0
v0.14.1
v0.15.0
v0.15.1
v0.15.2
v0.16.0
v0.16.1
v0.16.2
v0.16.3
v0.17.0
v0.17.1
v0.17.2
v0.17.3
v0.18.0
v0.18.1
v0.19.0
v0.19.1
v0.19.2
v0.19.3
v0.2.0
v0.20.0
v0.21.0
v0.21.1
v0.22.0
v0.22.1
v0.23.0
v0.23.1
v0.23.2
v0.24.0
v0.24.1
v0.24.2
v0.25.0
v0.25.1
v0.25.2
v0.26.0
v0.26.1
v0.3.0
v0.4.0
v0.5.0
v0.5.1
v0.6.0
v0.7.0
v0.8.0
v0.8.1
v0.9.0
v0.9.1
-
8bd4bf2393
Fixes for transpositions and expands
cuda-reduce
Angelos Katharopoulos
2025-06-23 05:49:49 -0700 -
fd1d0821d2
Make sure softmax doesn't change the actual max
Angelos Katharopoulos
2025-06-22 23:34:32 -0700 -
818e8e663e
Add an init reduce
Angelos Katharopoulos
2025-06-22 21:28:41 -0700 -
9d86a4d5ba
b3c1aaafd2
into5adf185f86
John Mai
2025-06-22 14:39:55 +0800 -
cc4b995723
Working col reduce
Angelos Katharopoulos
2025-06-21 23:39:40 -0700 -
664d8e42b8
Add comments and clean up
Angelos Katharopoulos
2025-06-21 12:44:26 -0700 -
abdb21f27c
Add helpers and atomic kernel
Angelos Katharopoulos
2025-06-21 12:37:35 -0700 -
323cc645ab
992eac905a
into5adf185f86
acsweet
2025-06-21 11:11:23 +0200 -
880751a084
Remove segmented reduce and fix row reduce
Angelos Katharopoulos
2025-06-19 02:53:41 -0700 -
cd523ffd9f
Working row reduce looped
Angelos Katharopoulos
2025-06-19 02:42:15 -0700 -
4d2b682a13
Simple row reduce
Angelos Katharopoulos
2025-06-18 23:17:16 -0700 -
b70a964cde
Optimize all reduce a bit
Angelos Katharopoulos
2025-06-18 14:33:27 -0700 -
9cf7ef1068
Add all reduce and atomic updates
Angelos Katharopoulos
2025-06-17 23:58:51 -0700 -
ab7c310914
Adapt the torch benchmark to run in CUDA
Angelos Katharopoulos
2025-06-17 15:56:33 -0700 -
382270d8b5
4d68bd3250
into5adf185f86
Eric Buehler
2025-06-21 00:37:59 -0400 -
c4b30485f2
cc4de6a607
into5adf185f86
Nripesh Niketan
2025-06-21 02:23:45 +0100 -
0d371aaffc
043c37cccd
into5adf185f86
Anastasiia Filippova
2025-06-20 19:19:51 -0600 -
5feed6cb77
cb4dc59a9e
into5adf185f86
Arkar Min Aung
2025-06-21 10:45:06 +1000 -
5adf185f86
update_modules()
when providing a subset (#2308) mainAngelos Katharopoulos
2025-06-20 17:19:46 -0700 -
8ec7713893
Fix style
Angelos Katharopoulos
2025-06-20 16:45:00 -0700 -
c9a9180584
Awni Hannun
2025-06-20 14:50:57 -0700 -
90072445e7
Fix the update_modules subset
Angelos Katharopoulos
2025-06-20 14:43:11 -0700 -
de190bfe82
fix
Awni Hannun
2025-06-20 13:24:24 -0700 -
6bb0b254fd
format
Awni Hannun
2025-06-20 13:01:27 -0700 -
1a0e884036
fix adding inputs arrays in matmul / srot
Awni Hannun
2025-06-20 12:56:40 -0700 -
72e21b7d51
perf tuning
Awni Hannun
2025-06-18 16:42:39 -0700 -
043c37cccd
Use last cuda stream instead of new one
Anastasiia Filippova
2025-06-20 16:07:41 +0200 -
755fb4f970
7c99acb799
into76831ed83d
Awni Hannun
2025-06-20 09:17:34 +0800 -
76831ed83d
Awni Hannun
2025-06-19 15:26:36 -0700 -
4749c57bdb
add license
Awni Hannun
2025-06-19 06:22:42 -0700 -
12322095a8
cuda release
Awni Hannun
2025-06-18 08:18:11 -0700 -
64af1f8920
d2e0b0465c
intob3d7b85376
Gaétan Lepage
2025-06-19 01:06:09 +0100 -
cc4de6a607
Increment 2: Implement major ops and add structure similar to cuda
Nripesh Niketan
2025-06-19 00:50:06 +0100 -
ac5adfa963
increment 1: few ops and jit update
Nripesh Niketan
2025-06-19 00:33:57 +0100 -
709e3aa875
9a5d162ebf
intob3d7b85376
DavitGrigoryan132
2025-06-18 13:36:09 +0100 -
b3d7b85376
Angelos Katharopoulos
2025-06-17 23:55:56 -0700 -
445478c98b
eeaf1fa463
intocad5c0241c
Param Thakkar
2025-06-18 10:49:45 +0800 -
fa0615d39b
Make ptx cache settable by environment variable
Angelos Katharopoulos
2025-06-17 15:45:03 -0700 -
cad5c0241c
Awni Hannun
2025-06-17 12:03:25 -0700 -
873cfa292e
fix copy
Awni Hannun
2025-06-17 10:51:09 -0700 -
3d94859ea2
cuda synch properly waits for all tasks to finish and clear
Awni Hannun
2025-06-17 07:20:05 -0700 -
e6ae350999
Deleted comments, renamed the function
Anastasiia Filippova
2025-06-17 08:55:02 +0200 -
b8022c578a
Awni Hannun
2025-06-16 18:49:32 -0700 -
870208eff5
Start sdpa vector
cuda-sdpa-vector
Angelos Katharopoulos
2025-06-15 21:58:34 -0700 -
3e276d6890
divmod, partition, sort fixes
Awni Hannun
2025-06-16 17:12:12 -0700 -
8bb8b76ae4
[Experiment] ROCM backend initial push
Nripesh Niketan
2025-06-16 22:42:56 +0100 -
1fba0176e1
688e421184
intobc53f8293f
Awni Hannun
2025-06-16 14:14:03 -0700 -
74d6ebd4bd
update ackn.
Goekdeniz-Guelmez
2025-06-16 22:49:53 +0200 -
a315af8981
format
Goekdeniz-Guelmez
2025-06-16 22:45:09 +0200 -
3713832e5e
adding test for silu and clipped silu
Goekdeniz-Guelmez
2025-06-16 22:44:13 +0200 -
9cb6df5960
adding to __init__.py
Goekdeniz-Guelmez
2025-06-16 22:36:35 +0200 -
a426880baf
format
Goekdeniz-Guelmez
2025-06-16 22:36:04 +0200 -
60cd4a5a6f
initial commit
Goekdeniz-Guelmez
2025-06-16 22:33:24 +0200 -
bc53f8293f
Awni Hannun
2025-06-16 13:14:46 -0700 -
abcf62ee55
format
Awni Hannun
2025-06-16 12:35:26 -0700 -
ff1f9ca5e8
more bug fixes
Awni Hannun
2025-06-16 12:28:50 -0700 -
70f2baf39f
Removed commented nogpu for all_reduce
Anastasiia Filippova
2025-06-16 19:11:28 +0200 -
71a47bc10d
Deleted useless import
Anastasiia Filippova
2025-06-16 19:08:38 +0200 -
7429613f76
more bug fixes
Awni Hannun
2025-06-16 09:35:58 -0700 -
e9fbdd20fb
Helper function to parse types
Anastasiia Filippova
2025-06-16 18:35:49 +0200 -
c552ff2451
Awni Hannun
2025-06-16 08:45:40 -0700 -
91817a165b
format
Awni Hannun
2025-06-16 07:46:40 -0700 -
14531cb14f
enable more tests
Awni Hannun
2025-06-16 07:45:01 -0700 -
f15a127900
nccl backend (all reduce + init)
Anastasiia Filippova
2025-06-16 14:28:53 +0200 -
85869fda0c
more fixes
Awni Hannun
2025-06-15 20:44:32 -0700 -
b13c7ef8f8
Fix some cuda back-end bugs and enable corresponding tests
Awni Hannun
2025-06-15 13:09:06 -0700 -
4fda5fbdf9
Awni Hannun
2025-06-15 10:56:48 -0700 -
5971bf3506
add python testing for cuda with ability to skip list of tests
Awni Hannun
2025-06-15 08:28:51 -0700 -
580776559b
Angelos Katharopoulos
2025-06-15 06:08:07 -0700 -
b3c1aaafd2
update: format code
John Mai
2025-06-15 17:35:33 +0800 -
989e8bab66
feat: Add benchmarking for ReLUSquared activation function
John Mai
2025-06-15 17:34:10 +0800 -
fe0672a9d2
docs: Update documentation to include ReLUSquared activation function
John Mai
2025-06-15 17:33:58 +0800 -
cbd353bf73
test: Add unit test for ReLUSquared activation function
John Mai
2025-06-15 17:07:33 +0800 -
940f64fe6a
feat: Add ReLUSquared activation function
John Mai
2025-06-15 17:07:22 +0800 -
cb4dc59a9e
feat(benchmarks): add comprehensive SVD performance benchmarks
Arkar Min Aung
2025-06-15 17:51:45 +1000 -
e5c8773371
feat(metal): implement complete Metal SVD with Jacobi algorithm
Arkar Min Aung
2025-06-15 17:44:38 +1000 -
229e3a29a6
Fix random
Angelos Katharopoulos
2025-06-14 23:53:03 -0700 -
bfe105990b
First working CUDA rope
Angelos Katharopoulos
2025-06-14 15:10:40 -0700 -
a14aaa7c9d
Awni Hannun
2025-06-14 17:54:00 -0700 -
3110982b0e
fp16 matmul fix + tf32 env var
Awni Hannun
2025-06-14 07:17:04 -0700 -
c353af5998
fix cuda arg reduce
Awni Hannun
2025-06-14 06:16:09 -0700 -
a6d780154f
Awni Hannun
2025-06-13 22:10:46 -0700 -
ffef01cf68
fix cuda gemm for bf16
Awni Hannun
2025-06-13 20:04:44 -0700 -
6871e2eeb7
Awni Hannun
2025-06-13 19:21:46 -0700 -
f2d0ea0607
fix cuda jit
Awni Hannun
2025-06-13 15:01:16 -0700 -
8402a2acf4
Awni Hannun
2025-06-13 11:13:00 -0700 -
fddb6933e1
Jagrit Digani
2025-06-13 10:44:56 -0700 -
628e36f7d9
fix complex matmul shape
Awni Hannun
2025-06-13 07:42:12 -0700 -
ea451af9a0
Update no copy condition in normalization to account for axis size 1
Jagrit Digani
2025-06-11 09:58:15 -0700 -
53fa981caf
Add architecture gen to device
Jagrit Digani
2025-06-11 09:56:01 -0700 -
b1d95a3880
Some cleanup
Jagrit Digani
2025-06-11 09:43:34 -0700 -
4b02d3e738
Comments and format
Jagrit Digani
2025-06-11 09:35:52 -0700 -
dd5e833068
Update addmm
Jagrit Digani
2025-06-11 09:30:49 -0700 -
b3013042ca
Redirect steel_gemm
Jagrit Digani
2025-06-11 09:26:07 -0700 -
fc2f6bc51c
Refactor AddMM step 1
Jagrit Digani
2025-06-11 09:01:45 -0700 -
9dbaa35be3
Add axpby routing to steel_matmul_regular
Jagrit Digani
2025-06-11 08:54:42 -0700 -
13eccfa887
Redirect steel_gemm_regular
Jagrit Digani
2025-06-11 08:49:07 -0700 -
96a7017442
Rearrange steel_gemm_regular
Jagrit Digani
2025-06-11 08:38:52 -0700 -
c2f1c2a338
Refactor split k axpby
Jagrit Digani
2025-06-11 07:47:56 -0700 -
9fd8eb357c
Refactor splitk step 1
Jagrit Digani
2025-06-11 07:29:36 -0700